This page describes the use cases, requirements and draft specification titled "ebXML RegRep Profile for PDF Documents":

Vision

Use Cases Illustrated By Example CQL Queries

Here are examples of a few use cases. Note that a query can contain multiple predicates combined using the boolean operators AND and OR, as defined by CQL.

Requirements

Specification

PDF Context Set

The following is a subset of PDF metadata properties that have been identified as the indexes for a CQL Context Set for PDF resources. These will be used on the left-hand side of relations such as "=", "<", etc. in query predicates (e.g. pdf.numberOfPages < 100). Each index name (e.g. numberOfPages) will be used to match a slot with the same name on the ExtrinsicObject for PDF resources. The slot value will be compared with the search term (the right-hand side of the relation, e.g. 100 in pdf.numberOfPages < 100). The type of the Value element of the Slot will be defined by the type of the index in the table below. For example, integer types will be mapped to IntegerValueType, string to StringValueType, dateTime to DateTimeValueType, etc.

Unless otherwise specified the Metadata Properties are defined by Table 317 – Entries in the document information dictionary in [PDF 32000-1:2008].

Metadata Property

Index Name

Data Type

Description

Author

author

string

CreationDate

creationDate

dateTime

Creator

creator

string

Keywords

keywords

string

ModDate

modificationDate

dateTime

Producer

producer

string

Subject

subject

string

Title

title

string

Trapped

trapped

boolean

NumberOfPages

numberOfPages

integer

The total number of pages in the PDF document

Canonical Data Defined By Profile

<?xml version="1.0" encoding="UTF-8"?>
<!--
  Canonical data defined by the PDF Profile of ebXML RegRep.

  This request submits a single RegistryPackage ("PDF Profile") that acts as
  the folder for every object the profile defines. At present it contains one
  ClassificationNode that adds the "pdf" object type beneath the
  ExtrinsicObject object type node.
-->
<SubmitObjectsRequest
    xmlns="urn:oasis:names:tc:ebxml-regrep:xsd:lcm:4.0"
    xmlns:lcm="urn:oasis:names:tc:ebxml-regrep:xsd:lcm:4.0"
    xmlns:query="urn:oasis:names:tc:ebxml-regrep:xsd:query:4.0"
    xmlns:rim="urn:oasis:names:tc:ebxml-regrep:xsd:rim:4.0"
    xmlns:rs="urn:oasis:names:tc:ebxml-regrep:xsd:rs:4.0"
    xmlns:xlink="http://www.w3.org/1999/xlink"
    xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
    xsi:schemaLocation="urn:oasis:names:tc:ebxml-regrep:xsd:lcm:4.0  http://docs.oasis-open.org/regrep/regrep-core/v4.0/cos01/xsd/lcm.xsd"
    id="urn:oasis:names:tc:ebxml-regrep:request:id">
  <rim:RegistryObjectList>

    <!-- Package (folder) that groups all objects defined by this profile. -->
    <rim:RegistryObject
        xsi:type="rim:RegistryPackageType"
        id="urn:oasis:names:tc:ebxml-regrep:profile:pdf"
        lid="urn:oasis:names:tc:ebxml-regrep:profile:pdf">
      <rim:Name>
        <rim:LocalizedString value="PDF Profile"/>
      </rim:Name>
      <rim:Description>
        <rim:LocalizedString value="Folder for all objects defined by the PDF Profile of ebXML RegRep."/>
      </rim:Description>
      <rim:VersionInfo userVersionName="1.0"/>
      <rim:RegistryObjectList>

        <!--
          ObjectType definitions.
          The id of this node is the value referenced by the objectType
          attribute of ExtrinsicObjects that represent PDF resources.
        -->
        <rim:RegistryObject
            xsi:type="rim:ClassificationNodeType"
            id="urn:oasis:names:tc:ebxml-regrep:profile:pdf:ObjectType:pdf"
            lid="urn:oasis:names:tc:ebxml-regrep:profile:pdf:ObjectType:pdf"
            parent="urn:oasis:names:tc:ebxml-regrep:ObjectType:RegistryObject:ExtrinsicObject"
            code="pdf">
          <rim:Name>
            <rim:LocalizedString value="PDF"/>
          </rim:Name>
        </rim:RegistryObject>

      </rim:RegistryObjectList>
    </rim:RegistryObject>
  </rim:RegistryObjectList>
</SubmitObjectsRequest>

Example of Cataloged ExtrinsicObject for a PDF Resource

<?xml version="1.0" encoding="UTF-8"?>
<!--
  Example of an ExtrinsicObject produced by cataloging a PDF resource.

  The creator, creationDate, author, title, producer and numberOfPages slots
  carry metadata of the PDF document; each slot name matches an index name of
  the PDF context set, and the xsi:type of each SlotValue follows the data
  type of that index (string -> StringValueType, dateTime -> DateTimeValueType,
  integer -> IntegerValueType).

  Only the namespaces actually used by this document are declared: the default
  (rim) namespace, which also resolves the unprefixed xsi:type values, and xsi.
-->
<RegistryObject xmlns="urn:oasis:names:tc:ebxml-regrep:xsd:rim:4.0"
                xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
                xsi:type="ExtrinsicObjectType"
                id="urn:test:PDFProfile:pdf:InstallGuide-4.13.pdf"
                lid="urn:test:PDFProfile:pdf:InstallGuide-4.13.pdf"
                objectType="urn:oasis:names:tc:ebxml-regrep:profile:pdf:ObjectType:pdf"
                mimeType="application/pdf"
                owner="rod"
                status="urn:oasis:names:tc:ebxml-regrep:StatusType:Submitted">
    <!-- Location(s) of the cataloged resource, held as a list of strings. -->
    <Slot name="urn:oasis:names:tc:ebxml-regrep:rim:RegistryObject:locators">
        <SlotValue xsi:type="CollectionValueType" collectionType="urn:oasis:names:tc:ebxml-regrep:CollectionType:List">
            <Element xsi:type="StringValueType">
                <Value>pdf/InstallGuide-4.13.pdf</Value>
            </Element>
        </SlotValue>
    </Slot>
    <Slot name="creator">
        <SlotValue xsi:type="StringValueType">
            <Value>Writer</Value>
        </SlotValue>
    </Slot>
    <!-- NOTE(review): this value has no time zone designator; confirm the
         intended zone (for example, append "Z" if the time is UTC). -->
    <Slot name="creationDate">
        <SlotValue xsi:type="DateTimeValueType">
            <Value>2013-08-29T14:31:36.000</Value>
        </SlotValue>
    </Slot>
    <Slot name="author">
        <SlotValue xsi:type="StringValueType">
            <Value>Farrukh Najmi</Value>
        </SlotValue>
    </Slot>
    <Slot name="title">
        <SlotValue xsi:type="StringValueType">
            <Value>RegRep Installation and Administration Guide</Value>
        </SlotValue>
    </Slot>
    <Slot name="producer">
        <SlotValue xsi:type="StringValueType">
            <Value>LibreOffice 3.4</Value>
        </SlotValue>
    </Slot>
    <Slot name="numberOfPages">
        <SlotValue xsi:type="IntegerValueType">
            <Value>51</Value>
        </SlotValue>
    </Slot>
    <Name>
        <LocalizedString xml:lang="en-US" value="InstallGuide-4.13.pdf"/>
    </Name>
    <Description>
        <LocalizedString xml:lang="en-US" value=""/>
    </Description>
    <VersionInfo versionName="4b962727c8a7ba21fc5c4bf2b7e7cb6c081289ad" userVersionName=""/>
    <ContentVersionInfo versionName="2fba87dfdd141914614933b9923f3b973b333ad9"/>
    <!-- The element content is left empty here so the example stays short and
         remains a valid base64 value; a real object carries the encoded PDF. -->
    <RepositoryItem><!-- base64-encoded PDF content omitted --></RepositoryItem>
</RegistryObject>

Open Issues

References

documents/plan/regrep4/PdfProfile (last edited 2013-10-28 14:42:54 by farrukh)