Sample code for 30+ languages & platforms
Unicode C

Extract Metadata XML from PDF

See more PDF Signatures Examples

Demonstrates how to extract the metadata XML from a PDF.

Chilkat Unicode C Downloads

Unicode C
#include <C_CkPdfW.h>
#include <C_CkStringBuilderW.h>
#include <C_CkXmlW.h>

void ChilkatSample(void)
    {
    BOOL success;
    HCkPdfW pdf;
    HCkStringBuilderW sbXml;
    HCkXmlW xml;
    const wchar_t *x_xmpmeta_xmlns_x;
    const wchar_t *x_xmpmeta_x_xmptk;
    const wchar_t *rdf_RDF_xmlns_rdf;
    const wchar_t *rdf_Description_rdf_about;
    const wchar_t *rdf_Description_xmlns_xmp;
    const wchar_t *rdf_Description_xmlns_dc;
    const wchar_t *rdf_Description_xmlns_xmpMM;
    const wchar_t *rdf_Description_xmlns_pdf;
    const wchar_t *rdf_Description_xmlns_xmpRights;
    const wchar_t *xmp_ModifyDate;
    const wchar_t *xmp_CreateDate;
    const wchar_t *xmp_MetadataDate;
    const wchar_t *xmp_CreatorTool;
    const wchar_t *dc_format;
    const wchar_t *rdf_li_xml_lang;
    const wchar_t *rdf_li;
    int i;
    int count_i;
    const wchar_t *xmpMM_DocumentID;
    const wchar_t *xmpMM_InstanceID;
    const wchar_t *pdf_Producer;
    const wchar_t *pdf_Keywords;
    const wchar_t *xmpRights_WebStatement;

    success = FALSE;

    // This example requires the Chilkat API to have been previously unlocked.
    // See Global Unlock Sample for sample code.

    pdf = CkPdfW_Create();

    success = CkPdfW_LoadFile(pdf,L"qa_data/pdf/blank_with_metadata.pdf");
    if (success == FALSE) {
        wprintf(L"%s\n",CkPdfW_lastErrorText(pdf));
        CkPdfW_Dispose(pdf);
        return;
    }

    sbXml = CkStringBuilderW_Create();
    // Note: Not all PDF files have metadata.  Metadata is optional.
    success = CkPdfW_GetMetadata(pdf,sbXml);
    if (success == FALSE) {
        wprintf(L"%s\n",CkPdfW_lastErrorText(pdf));
        CkPdfW_Dispose(pdf);
        CkStringBuilderW_Dispose(sbXml);
        return;
    }

    xml = CkXmlW_Create();
    CkXmlW_LoadSb(xml,sbXml,TRUE);

    wprintf(L"%s\n",CkXmlW_getXml(xml));

    // Sample PDF metadata XML:
    // (Code for parsing follows)

    // Use this online tool to generate parsing code from sample XML: 
    // Generate Parsing Code from XML

    // <?xml version="1.0" encoding="utf-8"?>
    // <x:xmpmeta xmlns:x="adobe:ns:meta/" x:xmptk="Adobe XMP Core 9.1-c001 79.675d0f7, 2023/06/11-19:21:16        ">
    //     <rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#">
    //         <rdf:Description rdf:about="" xmlns:xmp="http://ns.adobe.com/xap/1.0/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:xmpMM="http://ns.adobe.com/xap/1.0/mm/" xmlns:pdf="http://ns.adobe.com/pdf/1.3/" xmlns:xmpRights="http://ns.adobe.com/xap/1.0/rights/">
    //             <xmp:ModifyDate>2024-11-27T11:33:12-06:00</xmp:ModifyDate>
    //             <xmp:CreateDate>2024-11-27T11:28:23-06:00</xmp:CreateDate>
    //             <xmp:MetadataDate>2024-11-27T11:33:12-06:00</xmp:MetadataDate>
    //             <xmp:CreatorTool>Adobe Acrobat Pro (32-bit) 24.3.20112</xmp:CreatorTool>
    //             <dc:format>application/pdf</dc:format>
    //             <dc:title>
    //                 <rdf:Alt>
    //                     <rdf:li xml:lang="x-default">Blank</rdf:li>
    //                 </rdf:Alt>
    //             </dc:title>
    //             <dc:creator>
    //                 <rdf:Bag>
    //                     <rdf:li>Chilkat Software</rdf:li>
    //                 </rdf:Bag>
    //             </dc:creator>
    //             <dc:description>
    //                 <rdf:Alt>
    //                     <rdf:li xml:lang="x-default">Blank Document</rdf:li>
    //                 </rdf:Alt>
    //             </dc:description>
    //             <dc:subject>
    //                 <rdf:Bag>
    //                     <rdf:li>blank</rdf:li>
    //                     <rdf:li>metadata</rdf:li>
    //                     <rdf:li>document</rdf:li>
    //                 </rdf:Bag>
    //             </dc:subject>
    //             <xmpMM:DocumentID>uuid:34535ffa-b632-43f1-b1fd-80cea6fdc351</xmpMM:DocumentID>
    //             <xmpMM:InstanceID>uuid:69ace620-4c54-407f-8d45-6eebc90f34c2</xmpMM:InstanceID>
    //             <pdf:Producer>Adobe Acrobat Pro (32-bit) 24.3.20112</pdf:Producer>
    //             <pdf:Keywords>blank; metadata; document</pdf:Keywords>
    //             <xmpRights:WebStatement>https://www.chilkatsoft.com/</xmpRights:WebStatement>
    //         </rdf:Description>
    //     </rdf:RDF>
    // </x:xmpmeta>

    x_xmpmeta_xmlns_x = CkXmlW_getAttrValue(xml,L"xmlns:x");
    x_xmpmeta_x_xmptk = CkXmlW_getAttrValue(xml,L"x:xmptk");
    rdf_RDF_xmlns_rdf = CkXmlW_chilkatPath(xml,L"rdf:RDF|(xmlns:rdf)");
    rdf_Description_rdf_about = CkXmlW_chilkatPath(xml,L"rdf:RDF|rdf:Description|(rdf:about)");
    rdf_Description_xmlns_xmp = CkXmlW_chilkatPath(xml,L"rdf:RDF|rdf:Description|(xmlns:xmp)");
    rdf_Description_xmlns_dc = CkXmlW_chilkatPath(xml,L"rdf:RDF|rdf:Description|(xmlns:dc)");
    rdf_Description_xmlns_xmpMM = CkXmlW_chilkatPath(xml,L"rdf:RDF|rdf:Description|(xmlns:xmpMM)");
    rdf_Description_xmlns_pdf = CkXmlW_chilkatPath(xml,L"rdf:RDF|rdf:Description|(xmlns:pdf)");
    rdf_Description_xmlns_xmpRights = CkXmlW_chilkatPath(xml,L"rdf:RDF|rdf:Description|(xmlns:xmpRights)");
    xmp_ModifyDate = CkXmlW_getChildContent(xml,L"rdf:RDF|rdf:Description|xmp:ModifyDate");
    xmp_CreateDate = CkXmlW_getChildContent(xml,L"rdf:RDF|rdf:Description|xmp:CreateDate");
    xmp_MetadataDate = CkXmlW_getChildContent(xml,L"rdf:RDF|rdf:Description|xmp:MetadataDate");
    xmp_CreatorTool = CkXmlW_getChildContent(xml,L"rdf:RDF|rdf:Description|xmp:CreatorTool");
    dc_format = CkXmlW_getChildContent(xml,L"rdf:RDF|rdf:Description|dc:format");
    rdf_li_xml_lang = CkXmlW_chilkatPath(xml,L"rdf:RDF|rdf:Description|dc:title|rdf:Alt|rdf:li|(xml:lang)");
    rdf_li = CkXmlW_getChildContent(xml,L"rdf:RDF|rdf:Description|dc:title|rdf:Alt|rdf:li");
    rdf_li = CkXmlW_getChildContent(xml,L"rdf:RDF|rdf:Description|dc:creator|rdf:Bag|rdf:li");
    rdf_li_xml_lang = CkXmlW_chilkatPath(xml,L"rdf:RDF|rdf:Description|dc:description|rdf:Alt|rdf:li|(xml:lang)");
    rdf_li = CkXmlW_getChildContent(xml,L"rdf:RDF|rdf:Description|dc:description|rdf:Alt|rdf:li");
    i = 0;
    count_i = CkXmlW_NumChildrenHavingTag(xml,L"rdf:RDF|rdf:Description|dc:subject|rdf:Bag|rdf:li");
    while (i < count_i) {
        CkXmlW_putI(xml,i);
        rdf_li = CkXmlW_getChildContent(xml,L"rdf:RDF|rdf:Description|dc:subject|rdf:Bag|rdf:li[i]");
        i = i + 1;
    }

    xmpMM_DocumentID = CkXmlW_getChildContent(xml,L"rdf:RDF|rdf:Description|xmpMM:DocumentID");
    xmpMM_InstanceID = CkXmlW_getChildContent(xml,L"rdf:RDF|rdf:Description|xmpMM:InstanceID");
    pdf_Producer = CkXmlW_getChildContent(xml,L"rdf:RDF|rdf:Description|pdf:Producer");
    pdf_Keywords = CkXmlW_getChildContent(xml,L"rdf:RDF|rdf:Description|pdf:Keywords");
    xmpRights_WebStatement = CkXmlW_getChildContent(xml,L"rdf:RDF|rdf:Description|xmpRights:WebStatement");


    CkPdfW_Dispose(pdf);
    CkStringBuilderW_Dispose(sbXml);
    CkXmlW_Dispose(xml);

    }