Delphi ActiveX
Delphi ActiveX
Extract Metadata XML from PDF
See more PDF Signatures Examples
Demonstrates how to extract the metadata XML from a PDF.Chilkat Delphi ActiveX Downloads
uses
Winapi.Windows, Winapi.Messages, System.SysUtils, System.Variants, System.Classes, Vcl.Graphics,
Vcl.Controls, Vcl.Forms, Vcl.Dialogs, Vcl.StdCtrls, Chilkat_TLB;
...
procedure TForm1.Button1Click(Sender: TObject);
var
success: Integer;
pdf: TChilkatPdf;
sbXml: TChilkatStringBuilder;
xml: TChilkatXml;
x_xmpmeta_xmlns_x: WideString;
x_xmpmeta_x_xmptk: WideString;
rdf_RDF_xmlns_rdf: WideString;
rdf_Description_rdf_about: WideString;
rdf_Description_xmlns_xmp: WideString;
rdf_Description_xmlns_dc: WideString;
rdf_Description_xmlns_xmpMM: WideString;
rdf_Description_xmlns_pdf: WideString;
rdf_Description_xmlns_xmpRights: WideString;
xmp_ModifyDate: WideString;
xmp_CreateDate: WideString;
xmp_MetadataDate: WideString;
xmp_CreatorTool: WideString;
dc_format: WideString;
rdf_li_xml_lang: WideString;
rdf_li: WideString;
i: Integer;
count_i: Integer;
xmpMM_DocumentID: WideString;
xmpMM_InstanceID: WideString;
pdf_Producer: WideString;
pdf_Keywords: WideString;
xmpRights_WebStatement: WideString;
begin
success := 0;
// This example requires the Chilkat API to have been previously unlocked.
// See Global Unlock Sample for sample code.
pdf := TChilkatPdf.Create(Self);
success := pdf.LoadFile('qa_data/pdf/blank_with_metadata.pdf');
if (success = 0) then
begin
Memo1.Lines.Add(pdf.LastErrorText);
Exit;
end;
sbXml := TChilkatStringBuilder.Create(Self);
// Note: Not all PDF files have metadata. Metadata is optional.
success := pdf.GetMetadata(sbXml.ControlInterface);
if (success = 0) then
begin
Memo1.Lines.Add(pdf.LastErrorText);
Exit;
end;
xml := TChilkatXml.Create(Self);
xml.LoadSb(sbXml.ControlInterface,1);
Memo1.Lines.Add(xml.GetXml());
// Sample PDF metadata XML:
// (Code for parsing follows)
// Use this online tool to generate parsing code from sample XML:
// Generate Parsing Code from XML
// <?xml version="1.0" encoding="utf-8"?>
// <x:xmpmeta xmlns:x="adobe:ns:meta/" x:xmptk="Adobe XMP Core 9.1-c001 79.675d0f7, 2023/06/11-19:21:16 ">
// <rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#">
// <rdf:Description rdf:about="" xmlns:xmp="http://ns.adobe.com/xap/1.0/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:xmpMM="http://ns.adobe.com/xap/1.0/mm/" xmlns:pdf="http://ns.adobe.com/pdf/1.3/" xmlns:xmpRights="http://ns.adobe.com/xap/1.0/rights/">
// <xmp:ModifyDate>2024-11-27T11:33:12-06:00</xmp:ModifyDate>
// <xmp:CreateDate>2024-11-27T11:28:23-06:00</xmp:CreateDate>
// <xmp:MetadataDate>2024-11-27T11:33:12-06:00</xmp:MetadataDate>
// <xmp:CreatorTool>Adobe Acrobat Pro (32-bit) 24.3.20112</xmp:CreatorTool>
// <dc:format>application/pdf</dc:format>
// <dc:title>
// <rdf:Alt>
// <rdf:li xml:lang="x-default">Blank</rdf:li>
// </rdf:Alt>
// </dc:title>
// <dc:creator>
// <rdf:Bag>
// <rdf:li>Chilkat Software</rdf:li>
// </rdf:Bag>
// </dc:creator>
// <dc:description>
// <rdf:Alt>
// <rdf:li xml:lang="x-default">Blank Document</rdf:li>
// </rdf:Alt>
// </dc:description>
// <dc:subject>
// <rdf:Bag>
// <rdf:li>blank</rdf:li>
// <rdf:li>metadata</rdf:li>
// <rdf:li>document</rdf:li>
// </rdf:Bag>
// </dc:subject>
// <xmpMM:DocumentID>uuid:34535ffa-b632-43f1-b1fd-80cea6fdc351</xmpMM:DocumentID>
// <xmpMM:InstanceID>uuid:69ace620-4c54-407f-8d45-6eebc90f34c2</xmpMM:InstanceID>
// <pdf:Producer>Adobe Acrobat Pro (32-bit) 24.3.20112</pdf:Producer>
// <pdf:Keywords>blank; metadata; document</pdf:Keywords>
// <xmpRights:WebStatement>https://www.chilkatsoft.com/</xmpRights:WebStatement>
// </rdf:Description>
// </rdf:RDF>
// </x:xmpmeta>
x_xmpmeta_xmlns_x := xml.GetAttrValue('xmlns:x');
x_xmpmeta_x_xmptk := xml.GetAttrValue('x:xmptk');
rdf_RDF_xmlns_rdf := xml.ChilkatPath('rdf:RDF|(xmlns:rdf)');
rdf_Description_rdf_about := xml.ChilkatPath('rdf:RDF|rdf:Description|(rdf:about)');
rdf_Description_xmlns_xmp := xml.ChilkatPath('rdf:RDF|rdf:Description|(xmlns:xmp)');
rdf_Description_xmlns_dc := xml.ChilkatPath('rdf:RDF|rdf:Description|(xmlns:dc)');
rdf_Description_xmlns_xmpMM := xml.ChilkatPath('rdf:RDF|rdf:Description|(xmlns:xmpMM)');
rdf_Description_xmlns_pdf := xml.ChilkatPath('rdf:RDF|rdf:Description|(xmlns:pdf)');
rdf_Description_xmlns_xmpRights := xml.ChilkatPath('rdf:RDF|rdf:Description|(xmlns:xmpRights)');
xmp_ModifyDate := xml.GetChildContent('rdf:RDF|rdf:Description|xmp:ModifyDate');
xmp_CreateDate := xml.GetChildContent('rdf:RDF|rdf:Description|xmp:CreateDate');
xmp_MetadataDate := xml.GetChildContent('rdf:RDF|rdf:Description|xmp:MetadataDate');
xmp_CreatorTool := xml.GetChildContent('rdf:RDF|rdf:Description|xmp:CreatorTool');
dc_format := xml.GetChildContent('rdf:RDF|rdf:Description|dc:format');
rdf_li_xml_lang := xml.ChilkatPath('rdf:RDF|rdf:Description|dc:title|rdf:Alt|rdf:li|(xml:lang)');
rdf_li := xml.GetChildContent('rdf:RDF|rdf:Description|dc:title|rdf:Alt|rdf:li');
rdf_li := xml.GetChildContent('rdf:RDF|rdf:Description|dc:creator|rdf:Bag|rdf:li');
rdf_li_xml_lang := xml.ChilkatPath('rdf:RDF|rdf:Description|dc:description|rdf:Alt|rdf:li|(xml:lang)');
rdf_li := xml.GetChildContent('rdf:RDF|rdf:Description|dc:description|rdf:Alt|rdf:li');
i := 0;
count_i := xml.NumChildrenHavingTag('rdf:RDF|rdf:Description|dc:subject|rdf:Bag|rdf:li');
while i < count_i do
begin
xml.I := i;
rdf_li := xml.GetChildContent('rdf:RDF|rdf:Description|dc:subject|rdf:Bag|rdf:li[i]');
i := i + 1;
end;
xmpMM_DocumentID := xml.GetChildContent('rdf:RDF|rdf:Description|xmpMM:DocumentID');
xmpMM_InstanceID := xml.GetChildContent('rdf:RDF|rdf:Description|xmpMM:InstanceID');
pdf_Producer := xml.GetChildContent('rdf:RDF|rdf:Description|pdf:Producer');
pdf_Keywords := xml.GetChildContent('rdf:RDF|rdf:Description|pdf:Keywords');
xmpRights_WebStatement := xml.GetChildContent('rdf:RDF|rdf:Description|xmpRights:WebStatement');
end;