<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: ReadPDFFile V2 gives error when reading PDF file in Cortex XSOAR Discussions</title>
    <link>https://live.paloaltonetworks.com/t5/cortex-xsoar-discussions/readpdffile-v2-gives-error-when-reading-pdf-file/m-p/464484#M551</link>
    <description>&lt;P&gt;Do other PDFs with the same PDF version work with&amp;nbsp;&lt;SPAN&gt;ReadPDFFileV2&amp;nbsp;?&lt;/SPAN&gt;&lt;/P&gt;</description>
    <pubDate>Wed, 09 Feb 2022 12:54:48 GMT</pubDate>
    <dc:creator>jwilkes</dc:creator>
    <dc:date>2022-02-09T12:54:48Z</dc:date>
    <item>
      <title>ReadPDFFile V2 gives error when reading PDF file</title>
      <link>https://live.paloaltonetworks.com/t5/cortex-xsoar-discussions/readpdffile-v2-gives-error-when-reading-pdf-file/m-p/464408#M548</link>
      <description>&lt;P&gt;Hi everyone,&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I was trying to make a playbook to extract indicators (Hash values, domains, IP addresses) from a PDF file. I tried to use the ReadPDFFile V2 utility, however it gives the below error on 2 of the PDF files I tried.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;STRONG&gt;&lt;SPAN&gt;Command:&lt;/SPAN&gt;&lt;/STRONG&gt;&amp;nbsp;&lt;DIV class=""&gt;&lt;SPAN class=""&gt;!ReadPDFFileV2 entryID="29@14" maxImages="20" auto-extract="inline"&lt;/SPAN&gt;&lt;SPAN class=""&gt;(Scripts)&lt;/SPAN&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV&gt;&lt;SPAN class=""&gt;&lt;STRONG&gt;&lt;SPAN&gt;Reason&lt;/SPAN&gt;&lt;/STRONG&gt;&lt;/SPAN&gt;&lt;DIV class=""&gt;&lt;DIV&gt;&lt;DIV class=""&gt;&lt;SPAN class=""&gt;Could not load pdf file in EntryID 29@14 Error: '&lt;A href="http://www.w3.org/1999/xhtml" target="_blank" rel="noopener"&gt;http://www.w3.org/1999/xhtml&lt;/A&gt;'&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV class=""&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class=""&gt;&lt;SPAN class=""&gt;Any idea how I can resolve this?&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV class=""&gt;&lt;SPAN class=""&gt;I thought it was the PDF version at first (the original file is 1.5), so I tried converting to v1.8 and still it failed.&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV class=""&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class=""&gt;&lt;SPAN class=""&gt;Thanks in advance.&lt;/SPAN&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;</description>
      <pubDate>Wed, 09 Feb 2022 10:59:07 GMT</pubDate>
      <guid>https://live.paloaltonetworks.com/t5/cortex-xsoar-discussions/readpdffile-v2-gives-error-when-reading-pdf-file/m-p/464408#M548</guid>
      <dc:creator>pottapitot</dc:creator>
      <dc:date>2022-02-09T10:59:07Z</dc:date>
    </item>
    <item>
      <title>Re: ReadPDFFile V2 gives error when reading PDF file</title>
      <link>https://live.paloaltonetworks.com/t5/cortex-xsoar-discussions/readpdffile-v2-gives-error-when-reading-pdf-file/m-p/464470#M549</link>
      <description>&lt;P&gt;Good morning, is&amp;nbsp;&lt;SPAN&gt;'&lt;/SPAN&gt;&lt;A href="https://urldefense.proofpoint.com/v2/url?u=http-3A__www.w3.org_1999_xhtml&amp;amp;d=DwMFaQ&amp;amp;c=V9IgWpI5PvzTw83UyHGVSoW3Uc1MFWe5J8PTfkrzVSo&amp;amp;r=hk6f12QwQXt8CXDuWpGG0HjiB1o9z-RBhoeZw7sw6sA&amp;amp;m=IGJR29YWKBlG2FfrANYog3aExjp9v80yMXbDyf_As64kbKQwHQ8x9vnhNlpmXx3L&amp;amp;s=crfzZCF9Ij8dvBLzT6HD8KQTRtPBft7McyGSVX6j8d0&amp;amp;e=" target="_blank" rel="noopener nofollow noreferrer"&gt;http://www.w3.org/1999/xhtml&lt;/A&gt;&lt;SPAN&gt;' an indicator inside the PDF?&lt;/SPAN&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 09 Feb 2022 12:40:19 GMT</pubDate>
      <guid>https://live.paloaltonetworks.com/t5/cortex-xsoar-discussions/readpdffile-v2-gives-error-when-reading-pdf-file/m-p/464470#M549</guid>
      <dc:creator>jwilkes</dc:creator>
      <dc:date>2022-02-09T12:40:19Z</dc:date>
    </item>
    <item>
      <title>Re: ReadPDFFile V2 gives error when reading PDF file</title>
      <link>https://live.paloaltonetworks.com/t5/cortex-xsoar-discussions/readpdffile-v2-gives-error-when-reading-pdf-file/m-p/464480#M550</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://live.paloaltonetworks.com/t5/user/viewprofilepage/user-id/166751"&gt;@jwilkes&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;It is not present in the file. There are 2 other domains not related to this and a couple of hashes and CVE.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 09 Feb 2022 12:52:51 GMT</pubDate>
      <guid>https://live.paloaltonetworks.com/t5/cortex-xsoar-discussions/readpdffile-v2-gives-error-when-reading-pdf-file/m-p/464480#M550</guid>
      <dc:creator>pottapitot</dc:creator>
      <dc:date>2022-02-09T12:52:51Z</dc:date>
    </item>
    <item>
      <title>Re: ReadPDFFile V2 gives error when reading PDF file</title>
      <link>https://live.paloaltonetworks.com/t5/cortex-xsoar-discussions/readpdffile-v2-gives-error-when-reading-pdf-file/m-p/464484#M551</link>
      <description>&lt;P&gt;Do other PDFs with the same PDF version work with&amp;nbsp;&lt;SPAN&gt;ReadPDFFileV2&amp;nbsp;?&lt;/SPAN&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 09 Feb 2022 12:54:48 GMT</pubDate>
      <guid>https://live.paloaltonetworks.com/t5/cortex-xsoar-discussions/readpdffile-v2-gives-error-when-reading-pdf-file/m-p/464484#M551</guid>
      <dc:creator>jwilkes</dc:creator>
      <dc:date>2022-02-09T12:54:48Z</dc:date>
    </item>
    <item>
      <title>Re: ReadPDFFile V2 gives error when reading PDF file</title>
      <link>https://live.paloaltonetworks.com/t5/cortex-xsoar-discussions/readpdffile-v2-gives-error-when-reading-pdf-file/m-p/464521#M553</link>
      <description>&lt;P&gt;Hi &lt;a href="https://live.paloaltonetworks.com/t5/user/viewprofilepage/user-id/166751"&gt;@jwilkes&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I tried another file, the PDF present in the below site as testing. That also failed with the same error.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;A href="https://www.ncsc.gov.uk/news/indicators-of-compromise-for-malware-used-by-apt28" target="_blank" rel="noopener"&gt;https://www.ncsc.gov.uk/news/indicators-of-compromise-for-malware-used-by-apt28&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Since I am experimenting I am using the playbook "&lt;SPAN&gt;Phishing - Generic v3". The ReadPDFFilev2 is present in it and it stops there with the above error.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 09 Feb 2022 14:08:54 GMT</pubDate>
      <guid>https://live.paloaltonetworks.com/t5/cortex-xsoar-discussions/readpdffile-v2-gives-error-when-reading-pdf-file/m-p/464521#M553</guid>
      <dc:creator>pottapitot</dc:creator>
      <dc:date>2022-02-09T14:08:54Z</dc:date>
    </item>
    <item>
      <title>Re: ReadPDFFile V2 gives error when reading PDF file</title>
      <link>https://live.paloaltonetworks.com/t5/cortex-xsoar-discussions/readpdffile-v2-gives-error-when-reading-pdf-file/m-p/464542#M554</link>
      <description>&lt;P&gt;&lt;a href="https://live.paloaltonetworks.com/t5/user/viewprofilepage/user-id/208955"&gt;@pottapitot&lt;/a&gt;&amp;nbsp;,&lt;/P&gt;&lt;P&gt;I tried that same file for my XSOAR instance (6.2) and it failed as well.&amp;nbsp; Can you please create a support ticket to investigate this further?&amp;nbsp; I know that &lt;SPAN&gt;ReadPDFFileV2&amp;nbsp;uses the linux utility&amp;nbsp;&lt;/SPAN&gt;"pdftohtml" and maybe there are some limitations.&lt;BR /&gt;&lt;BR /&gt;I know we have found limitations before but they were with PDF encryption:&amp;nbsp;&lt;A href="https://xsoar.ideas.aha.io/ideas/FR-I-1397" target="_blank"&gt;https://xsoar.ideas.aha.io/ideas/FR-I-1397&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 09 Feb 2022 14:39:47 GMT</pubDate>
      <guid>https://live.paloaltonetworks.com/t5/cortex-xsoar-discussions/readpdffile-v2-gives-error-when-reading-pdf-file/m-p/464542#M554</guid>
      <dc:creator>jwilkes</dc:creator>
      <dc:date>2022-02-09T14:39:47Z</dc:date>
    </item>
    <item>
      <title>Re: ReadPDFFile V2 gives error when reading PDF file</title>
      <link>https://live.paloaltonetworks.com/t5/cortex-xsoar-discussions/readpdffile-v2-gives-error-when-reading-pdf-file/m-p/464546#M555</link>
      <description>&lt;P&gt;&lt;a href="https://live.paloaltonetworks.com/t5/user/viewprofilepage/user-id/166751"&gt;@jwilkes&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Wow! I am impressed by the speed of the resolution. I was looking through the automation script after my previous post when I noticed there was an update for the ReadPDFFileV2 script. I updated the automation and tried it again. Now it works perfectly!&lt;/P&gt;&lt;P&gt;I am not sure how you did it but once again thanks a lot!&amp;nbsp;&lt;span class="lia-unicode-emoji" title=":grinning_face_with_big_eyes:"&gt;😃&lt;/span&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 09 Feb 2022 14:52:19 GMT</pubDate>
      <guid>https://live.paloaltonetworks.com/t5/cortex-xsoar-discussions/readpdffile-v2-gives-error-when-reading-pdf-file/m-p/464546#M555</guid>
      <dc:creator>pottapitot</dc:creator>
      <dc:date>2022-02-09T14:52:19Z</dc:date>
    </item>
    <item>
      <title>Re: ReadPDFFile V2 gives error when reading PDF file</title>
      <link>https://live.paloaltonetworks.com/t5/cortex-xsoar-discussions/readpdffile-v2-gives-error-when-reading-pdf-file/m-p/464549#M556</link>
      <description>&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="jwilkes_0-1644418739377.png" style="width: 400px;"&gt;&lt;img src="https://live.paloaltonetworks.com/t5/image/serverpage/image-id/39042i2B06FEC138A56934/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="jwilkes_0-1644418739377.png" alt="jwilkes_0-1644418739377.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;Yes, this looks related.&amp;nbsp; Glad to help!&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 09 Feb 2022 14:59:18 GMT</pubDate>
      <guid>https://live.paloaltonetworks.com/t5/cortex-xsoar-discussions/readpdffile-v2-gives-error-when-reading-pdf-file/m-p/464549#M556</guid>
      <dc:creator>jwilkes</dc:creator>
      <dc:date>2022-02-09T14:59:18Z</dc:date>
    </item>
  </channel>
</rss>

