hubgit · September 3, 2025 18:33 · dragon-dxw · Sep 3, 2025
diff --git a/README.md b/README.md
diff --git a/pdftk-unset-info-dictionary-values.php b/pdftk-unset-info-dictionary-values.php
 <?php

 /**
  * Blank every Info dictionary value of a PDF, in place, using pdftk.
  *
  * Steps: dump the metadata with `pdftk dump_data`, replace each
  * `InfoValue:` line with an empty value, feed the edited dump back through
  * `pdftk update_info` into a temporary PDF, then move that PDF over the
  * original.
  *
  * Throws Exception when pdftk fails or a temporary file cannot be
  * created, written or moved. Temporary files are removed on every path.
  */

 $file = 'example.pdf';

 // get the current metadata
 $command = sprintf('pdftk %s dump_data', escapeshellarg($file));
 $output = array(); $return = null; exec($command, $output, $return);

 // a non-zero exit status means pdftk could not read the file
 if ($return) {
     throw new Exception('There was an error reading metadata from the PDF file');
 }

 // set any metadata values to null (the InfoKey lines are kept, so each key
 // is paired with an empty value)
 foreach ($output as $index => $line) {
     if (strpos($line, 'InfoValue:') === 0) {
         $output[$index] = 'InfoValue:';
     }
 }

 // tempnam() creates its file with mode 0600; remember the original mode so
 // the rewritten PDF does not silently become owner-only
 $originalMode = fileperms($file);

 // write the updated metadata to a file
 $metadataFile = tempnam(sys_get_temp_dir(), 'pdf-meta-');

 if ($metadataFile === false) {
     throw new Exception('There was an error creating a temporary metadata file');
 }

 $tmpFile = false;

 try {
     if (file_put_contents($metadataFile, implode("\n", $output)) === false) {
         throw new Exception('There was an error writing the temporary metadata file');
     }

     // create a new PDF using the updated metadata
     $tmpFile = tempnam(sys_get_temp_dir(), 'pdf-tmp-');

     if ($tmpFile === false) {
         throw new Exception('There was an error creating a temporary PDF file');
     }

     $command = sprintf('pdftk %s update_info %s output %s',
         escapeshellarg($file), escapeshellarg($metadataFile), escapeshellarg($tmpFile));
     $output = array(); $return = null; exec($command, $output, $return);

     if ($return) {
         throw new Exception('There was an error writing metadata to the PDF file');
     }

     // replace the original only after pdftk has succeeded
     if (!rename($tmpFile, $file)) {
         throw new Exception('There was an error replacing the original PDF file');
     }

     // the temporary PDF now lives at $file, so there is nothing left to delete
     $tmpFile = false;

     if ($originalMode !== false) {
         chmod($file, $originalMode & 0777);
     }
 } finally {
     // clean up the temporary files, including on the failure paths
     if (file_exists($metadataFile)) {
         unlink($metadataFile);
     }

     if ($tmpFile !== false && file_exists($tmpFile)) {
         unlink($tmpFile);
     }
 }
diff --git a/remove-pdf-metadata.sh b/remove-pdf-metadata.sh
 #!/bin/bash

 # Strip metadata (Info dictionary + XMP) from a PDF in place.
 # Requires exiftool and qpdf on the PATH.

 # abort on the first failing command or unset variable, so a failed step is
 # never followed by the next one
 set -euo pipefail

 FILE=example.pdf

 # read tags from the original PDF
 #exiftool -all:all "$FILE"

 # remove tags (XMP + metadata) from the PDF
 # NOTE: unless -overwrite_original is given, exiftool keeps the untouched
 # input as "${FILE}_original"; that copy still contains the metadata
 exiftool -all:all= "$FILE"

 # linearize the file to remove orphan data
 # qpdf needs an explicit output file, so write next to the input and move
 # the result into place only once qpdf has produced it
 TMP_FILE="${FILE}.linearized.$$"
 trap 'rm -f "$TMP_FILE"' EXIT

 # qpdf exits with 3 when it wrote the output but emitted warnings; treat that
 # as success and anything else non-zero as a failure
 STATUS=0
 qpdf --linearize "$FILE" "$TMP_FILE" || STATUS=$?
 if [ "$STATUS" -ne 0 ] && [ "$STATUS" -ne 3 ]; then
     echo "qpdf failed with exit status $STATUS" >&2
     exit "$STATUS"
 fi

 mv "$TMP_FILE" "$FILE"

 # read XMP from the modified PDF
 #exiftool -all:all "$FILE"

 # read all strings from the modified PDF
 #strings "$FILE" > "$FILE.txt"

 # read XMP from embedded objects in the modified PDF
 #exiftool -extractEmbedded -all:all "$FILE"
	<?php

	/**
	 * Blank every Info dictionary value of a PDF, in place, using pdftk.
	 *
	 * Steps: dump the metadata with `pdftk dump_data`, replace each
	 * `InfoValue:` line with an empty value, feed the edited dump back through
	 * `pdftk update_info` into a temporary PDF, then move that PDF over the
	 * original.
	 *
	 * Throws Exception when pdftk fails or a temporary file cannot be
	 * created, written or moved. Temporary files are removed on every path.
	 */

	$file = 'example.pdf';

	// get the current metadata
	$command = sprintf('pdftk %s dump_data', escapeshellarg($file));
	$output = array(); $return = null; exec($command, $output, $return);

	// a non-zero exit status means pdftk could not read the file
	if ($return) {
	    throw new Exception('There was an error reading metadata from the PDF file');
	}

	// set any metadata values to null (the InfoKey lines are kept, so each key
	// is paired with an empty value)
	foreach ($output as $index => $line) {
	    if (strpos($line, 'InfoValue:') === 0) {
	        $output[$index] = 'InfoValue:';
	    }
	}

	// tempnam() creates its file with mode 0600; remember the original mode so
	// the rewritten PDF does not silently become owner-only
	$originalMode = fileperms($file);

	// write the updated metadata to a file
	$metadataFile = tempnam(sys_get_temp_dir(), 'pdf-meta-');

	if ($metadataFile === false) {
	    throw new Exception('There was an error creating a temporary metadata file');
	}

	$tmpFile = false;

	try {
	    if (file_put_contents($metadataFile, implode("\n", $output)) === false) {
	        throw new Exception('There was an error writing the temporary metadata file');
	    }

	    // create a new PDF using the updated metadata
	    $tmpFile = tempnam(sys_get_temp_dir(), 'pdf-tmp-');

	    if ($tmpFile === false) {
	        throw new Exception('There was an error creating a temporary PDF file');
	    }

	    $command = sprintf('pdftk %s update_info %s output %s',
	        escapeshellarg($file), escapeshellarg($metadataFile), escapeshellarg($tmpFile));
	    $output = array(); $return = null; exec($command, $output, $return);

	    if ($return) {
	        throw new Exception('There was an error writing metadata to the PDF file');
	    }

	    // replace the original only after pdftk has succeeded
	    if (!rename($tmpFile, $file)) {
	        throw new Exception('There was an error replacing the original PDF file');
	    }

	    // the temporary PDF now lives at $file, so there is nothing left to delete
	    $tmpFile = false;

	    if ($originalMode !== false) {
	        chmod($file, $originalMode & 0777);
	    }
	} finally {
	    // clean up the temporary files, including on the failure paths
	    if (file_exists($metadataFile)) {
	        unlink($metadataFile);
	    }

	    if ($tmpFile !== false && file_exists($tmpFile)) {
	        unlink($tmpFile);
	    }
	}