{"id":1921,"date":"2011-02-08T18:50:00","date_gmt":"2011-02-08T18:50:00","guid":{"rendered":"http:\/\/www.b.shuttle.de\/hayek\/Hayek\/Jochen\/wp\/blog-en\/2011\/02\/08\/pdftohtml-vs-drm\/"},"modified":"2011-02-08T18:50:00","modified_gmt":"2011-02-08T18:50:00","slug":"pdftohtml-vs-drm","status":"publish","type":"post","link":"https:\/\/wp.jochen.hayek.name\/blog-en\/2011\/02\/08\/pdftohtml-vs-drm\/","title":{"rendered":"&#8220;pdftohtml&#8221; vs. DRM"},"content":{"rendered":"<p>\t\t\t\tA project of mine involves extracting strings and other details from PDF files using &#8220;<span>pdftohtml -xml<\/span>&#8221;.<\/p>\n<div>\n<\/div>\n<div>\nA plain\u00a0&#8220;<span>pdftohtml -xml<\/span>&#8221; refuses to read PDF files with copy-protection bits set. But if you add &#8220;<span>-nodrm<\/span>&#8221; on the command line, it reads them anyway, but it mentions the problem on STDERR.<\/div>\n","protected":false},"excerpt":{"rendered":"<p>A project of mine involves extracting strings and other details from PDF files using &#8220;pdftohtml -xml&#8221;. A plain\u00a0&#8220;pdftohtml -xml&#8221; refuses to read PDF files with copy-protection bits set. 
But if you add &#8220;-nodrm&#8221; on the command line, it reads them anyway, but it mentions the problem on STDERR.<\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"_jetpack_newsletter_access":"","_jetpack_dont_email_post_to_subs":false,"_jetpack_newsletter_tier_id":0,"_jetpack_memberships_contains_paywalled_content":false,"_jetpack_feature_clip_id":0,"_jetpack_memberships_contains_paid_content":false,"footnotes":"","jetpack_publicize_message":"","jetpack_publicize_feature_enabled":true,"jetpack_social_post_already_shared":false,"jetpack_social_options":{"image_generator_settings":{"template":"highway","default_image_id":0,"font":"","enabled":false},"version":2},"jetpack_post_was_ever_published":false,"_share_on_mastodon":"0"},"categories":[666],"tags":[],"class_list":["post-1921","post","type-post","status-publish","format-standard","hentry","category-uncategorized"],"share_on_mastodon":{"url":"","error":""},"jetpack_publicize_connections":[],"jetpack_featured_media_url":"","jetpack_sharing_enabled":true,"jetpack_shortlink":"https:\/\/wp.me\/paO0kP-uZ","jetpack_likes_enabled":true,"amp_enabled":true,"_links":{"self":[{"href":"https:\/\/wp.jochen.hayek.name\/blog-en\/wp-json\/wp\/v2\/posts\/1921","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/wp.jochen.hayek.name\/blog-en\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/wp.jochen.hayek.name\/blog-en\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/wp.jochen.hayek.name\/blog-en\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/wp.jochen.hayek.name\/blog-en\/wp-json\/wp\/v2\/comments?post=1921"}],"version-history":[{"count":0,"href":"https:\/\/wp.jochen.hayek.name\/blog-en\/wp-json\/wp\/v2\/posts\/1921\/revisions"}],"wp:attachment":[{"href":"https:\/\/wp.jochen.hayek.name\/blog-en\/wp-json\/wp\/v2\/media?parent=1921"}],"wp:
term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/wp.jochen.hayek.name\/blog-en\/wp-json\/wp\/v2\/categories?post=1921"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/wp.jochen.hayek.name\/blog-en\/wp-json\/wp\/v2\/tags?post=1921"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}