<?xml version="1.0" encoding="UTF-8"?>
<feed xmlns="http://www.w3.org/2005/Atom" xml:lang="en">
	<id>https://wiki.docgyver.com/index.php?action=history&amp;feed=atom&amp;title=PDF_Notes</id>
	<title>PDF Notes - Revision history</title>
	<link rel="self" type="application/atom+xml" href="https://wiki.docgyver.com/index.php?action=history&amp;feed=atom&amp;title=PDF_Notes"/>
	<link rel="alternate" type="text/html" href="https://wiki.docgyver.com/index.php?title=PDF_Notes&amp;action=history"/>
	<updated>2026-04-18T13:40:32Z</updated>
	<subtitle>Revision history for this page on the wiki</subtitle>
	<generator>MediaWiki 1.38.2</generator>
	<entry>
		<id>https://wiki.docgyver.com/index.php?title=PDF_Notes&amp;diff=204&amp;oldid=prev</id>
		<title>DocGyver at 14:04, 10 December 2021</title>
		<link rel="alternate" type="text/html" href="https://wiki.docgyver.com/index.php?title=PDF_Notes&amp;diff=204&amp;oldid=prev"/>
		<updated>2021-12-10T14:04:03Z</updated>

		<summary type="html">&lt;p&gt;&lt;/p&gt;
&lt;table style=&quot;background-color: #fff; color: #202122;&quot; data-mw=&quot;interface&quot;&gt;
				&lt;col class=&quot;diff-marker&quot; /&gt;
				&lt;col class=&quot;diff-content&quot; /&gt;
				&lt;col class=&quot;diff-marker&quot; /&gt;
				&lt;col class=&quot;diff-content&quot; /&gt;
				&lt;tr class=&quot;diff-title&quot; lang=&quot;en&quot;&gt;
				&lt;td colspan=&quot;2&quot; style=&quot;background-color: #fff; color: #202122; text-align: center;&quot;&gt;← Older revision&lt;/td&gt;
				&lt;td colspan=&quot;2&quot; style=&quot;background-color: #fff; color: #202122; text-align: center;&quot;&gt;Revision as of 14:04, 10 December 2021&lt;/td&gt;
				&lt;/tr&gt;&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot; id=&quot;mw-diff-left-l35&quot;&gt;Line 35:&lt;/td&gt;
&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot;&gt;Line 35:&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;lt;pre&amp;gt;&lt;/div&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;lt;pre&amp;gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;find . -regextype posix-extended  -regex &amp;quot;.*/[0-9]{8}_[0-9]{6}.*&amp;quot; -exec rename -v 's/(\d{4})(\d{2})(\d{2})_(\d{2})(\d{2})(\d{2})/$1-$2-$3_$4.$5.$6/' {} \;&lt;/div&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;find . -regextype posix-extended  -regex &amp;quot;.*/[0-9]{8}_[0-9]{6}.*&amp;quot; -exec rename -v 's/(\d{4})(\d{2})(\d{2})_(\d{2})(\d{2})(\d{2})/$1-$2-$3_$4.$5.$6/' {} \;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-side-deleted&quot;&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot; data-marker=&quot;+&quot;&gt;&lt;/td&gt;&lt;td style=&quot;color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&lt;ins style=&quot;font-weight: bold; text-decoration: none;&quot;&gt;&amp;lt;/pre&gt;&lt;/ins&gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-side-deleted&quot;&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot; data-marker=&quot;+&quot;&gt;&lt;/td&gt;&lt;td style=&quot;color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&lt;ins style=&quot;font-weight: bold; text-decoration: none;&quot;&gt;=Bash Script for processing scans=&lt;/ins&gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-side-deleted&quot;&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot; data-marker=&quot;+&quot;&gt;&lt;/td&gt;&lt;td style=&quot;color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&lt;ins style=&quot;font-weight: bold; text-decoration: none;&quot;&gt;&amp;lt;pre&gt;&lt;/ins&gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-side-deleted&quot;&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot; data-marker=&quot;+&quot;&gt;&lt;/td&gt;&lt;td style=&quot;color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&lt;ins style=&quot;font-weight: bold; text-decoration: none;&quot;&gt;cd &amp;lt;sourcefolder&gt;&lt;/ins&gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-side-deleted&quot;&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot; data-marker=&quot;+&quot;&gt;&lt;/td&gt;&lt;td style=&quot;color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&lt;ins style=&quot;font-weight: bold; text-decoration: none;&quot;&gt;tiffcp &amp;lt;list of tif files&gt; &amp;lt;output.pdf&gt;&lt;/ins&gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-side-deleted&quot;&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot; data-marker=&quot;+&quot;&gt;&lt;/td&gt;&lt;td style=&quot;color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&lt;ins style=&quot;font-weight: bold; text-decoration: none;&quot;&gt;cp &amp;lt;output.pdf&gt; //wormhole/Media/OCRMyPDF/Input&lt;/ins&gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-side-deleted&quot;&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot; data-marker=&quot;+&quot;&gt;&lt;/td&gt;&lt;td style=&quot;color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&lt;ins style=&quot;font-weight: bold; text-decoration: none;&quot;&gt;cp //wormhole/Media/OCRMyPDF/Output/&amp;lt;output.pdf&gt; &amp;lt;destination folder&gt;&lt;/ins&gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;lt;/pre&amp;gt;&lt;/div&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;lt;/pre&amp;gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;/table&gt;</summary>
		<author><name>DocGyver</name></author>
	</entry>
	<entry>
		<id>https://wiki.docgyver.com/index.php?title=PDF_Notes&amp;diff=189&amp;oldid=prev</id>
		<title>DocGyver: Created page with &quot;  =References= * https://medium.com/@kaerumy/cleaning-up-scanned-documents-with-open-source-tools-9d87e15305b * https://github.com/scantailor/scantailor/wiki/Split-Pages * htt...&quot;</title>
		<link rel="alternate" type="text/html" href="https://wiki.docgyver.com/index.php?title=PDF_Notes&amp;diff=189&amp;oldid=prev"/>
		<updated>2020-08-08T15:28:14Z</updated>

		<summary type="html">&lt;p&gt;Created page with &amp;quot;  =References= * https://medium.com/@kaerumy/cleaning-up-scanned-documents-with-open-source-tools-9d87e15305b * https://github.com/scantailor/scantailor/wiki/Split-Pages * htt...&amp;quot;&lt;/p&gt;
&lt;p&gt;&lt;b&gt;New page&lt;/b&gt;&lt;/p&gt;&lt;div&gt;&lt;br /&gt;
&lt;br /&gt;
=References=&lt;br /&gt;
* https://medium.com/@kaerumy/cleaning-up-scanned-documents-with-open-source-tools-9d87e15305b&lt;br /&gt;
* https://github.com/scantailor/scantailor/wiki/Split-Pages&lt;br /&gt;
* http://www.tobias-elze.de/pdfsandwich/&lt;br /&gt;
&lt;br /&gt;
* https://www.howtogeek.com/197195/how-to-remove-a-password-from-a-pdf-file-in-linux/&lt;br /&gt;
* https://stackoverflow.com/questions/36270555/open-a-pdf-with-blank-password-with-pdftk&lt;br /&gt;
&lt;br /&gt;
* https://www.howtogeek.com/228796/how-to-extract-and-save-images-from-a-pdf-file-in-linux/&lt;br /&gt;
* https://ocrmypdf.readthedocs.io/en/latest/cookbook.html&lt;br /&gt;
* https://www.onetransistor.eu/2015/12/ocr-searchable-pdf-linux.html&lt;br /&gt;
&lt;br /&gt;
=Bash Script for converting Magazine=&lt;br /&gt;
&amp;lt;pre&amp;gt;&lt;br /&gt;
for fn in *.pdf ; do&lt;br /&gt;
	echo $fn&lt;br /&gt;
	#Cleanup from prior runs&lt;br /&gt;
	rm -f tmp/images*tif&lt;br /&gt;
	#Split pdf pages into individual tif files&lt;br /&gt;
	pdfimages -tiff &amp;quot;$fn&amp;quot; ./tmp/images&lt;br /&gt;
&lt;br /&gt;
	#combine into a single tif file&lt;br /&gt;
	tiffcp tmp/images*tif $(basename &amp;quot;$fn&amp;quot; .pdf).tif&lt;br /&gt;
&lt;br /&gt;
	####put combined TIF into docker folder for OCRMyPDF and wait for output&lt;br /&gt;
&lt;br /&gt;
	#&lt;br /&gt;
	tiff2pdf -o ../../../OCRMyPDF/Input/$fn $(basename &amp;quot;$fn&amp;quot; .pdf).tif&lt;br /&gt;
done&lt;br /&gt;
rm tmp/images*tif&lt;br /&gt;
&amp;lt;/pre&amp;gt;&lt;br /&gt;
=Bash command to rename yyyymmdd_hhmmss to yyyy-mm-dd_hh.mm.ss=&lt;br /&gt;
&amp;lt;pre&amp;gt;&lt;br /&gt;
find . -regextype posix-extended  -regex &amp;quot;.*/[0-9]{8}_[0-9]{6}.*&amp;quot; -exec rename -v 's/(\d{4})(\d{2})(\d{2})_(\d{2})(\d{2})(\d{2})/$1-$2-$3_$4.$5.$6/' {} \;&lt;br /&gt;
&amp;lt;/pre&amp;gt;&lt;/div&gt;</summary>
		<author><name>DocGyver</name></author>
	</entry>
</feed>