question

Upvotes
Accepted
1 1 0 1

How should multiple records in the entity bulk download be interpreted?

Looking at the bulk download for organizations from here: https://permid.org/download

I find multiple records for the same PermID. How should I reconcile conflicting information across these records? Does the record with the highest line number in the file have the correct data? Here are some example records for PermID = 4296182513.

194571:<https://permid.org/1-4296182513>
194572-        a                               tr-org:Organization ;
194573-        mdaas:HeadquartersAddress       "2479 E Bayshore Rd Ste 195\nPALO ALTO\nCALIFORNIA\n94303-3230\nUnited States\n"^^xsd:string ;
194574-        mdaas:RegisteredAddress         "112 North Curry St\nCARSON CITY\nNEVADA\n89703\nUnited States\n"^^xsd:string ;
194575-        tr-common:hasPermId             "4296182513"^^xsd:string ;
194576-        tr-fin:hasOrganizationPrimaryQuote
194577-                <https://permid.org/1-21539925349> ;
194578-        tr-fin:hasPrimaryInstrument     <https://permid.org/1-8589997596> ;
194579-        tr-org:hasActivityStatus        tr-org:statusActive ;
194580-        tr-org:hasHeadquartersFaxNumber
194581-                "14088241543"^^xsd:string ;
194582-        tr-org:hasHeadquartersPhoneNumber
194583-                "14087022167"^^xsd:string ;
194584-        tr-org:hasHoldingClassification
194585-                tr-org:publiclyHeld ;
194586-        tr-org:hasLatestOrganizationFoundedDate
194587-                "1999-04-08T00:00:00Z"^^xsd:dateTime ;
194588-        tr-org:hasPrimaryBusinessSector
194589-                <https://permid.org/1-4294952830> ;
194590-        tr-org:hasPrimaryEconomicSector
194591-                <https://permid.org/1-4294952723> ;
194592-        tr-org:hasPrimaryIndustryGroup  <https://permid.org/1-4294952829> ;
194593-        tr-org:isIncorporatedIn         <http://sws.geonames.org/6252001/> ;
194594-        fibo-be-le-cb:isDomiciledIn     <http://sws.geonames.org/6252001/> ;
194595-        vcard:hasURL                    <http://www.sysorex.com/> ;
194596-        vcard:organization-name         "Sysorex Global"^^xsd:string .
--
266704:<https://permid.org/1-4296182513>
266705-        a                               tr-org:Organization ;
266706-        mdaas:HeadquartersAddress       "2479 E Bayshore Rd Ste 195\nPALO ALTO\nCALIFORNIA\n94303\nUnited States\n"^^xsd:string ;
266707-        mdaas:RegisteredAddress         "112 N Curry St\nCARSON CITY\nNEVADA\n89703-4934\nUnited States\n"^^xsd:string ;
266708-        tr-common:hasPermId             "4296182513"^^xsd:string ;
266709-        tr-fin:hasOrganizationPrimaryQuote
266710-                <https://permid.org/1-21539925349> ;
266711-        tr-fin:hasPrimaryInstrument     <https://permid.org/1-8589997596> ;
266712-        tr-org:hasActivityStatus        tr-org:statusActive ;
266713-        tr-org:hasHeadquartersFaxNumber
266714-                "14088241543"^^xsd:string ;
266715-        tr-org:hasHeadquartersPhoneNumber
266716-                "14087022167"^^xsd:string ;
266717-        tr-org:hasHoldingClassification
266718-                tr-org:publiclyHeld ;
266719-        tr-org:hasIPODate               "2014-04-10T04:00:00Z"^^xsd:dateTime ;
266720-        tr-org:hasLatestOrganizationFoundedDate
266721-                "1999-04-08T00:00:00Z"^^xsd:dateTime ;
266722-        tr-org:hasPrimaryBusinessSector
266723-                <https://permid.org/1-4294952830> ;
266724-        tr-org:hasPrimaryEconomicSector
266725-                <https://permid.org/1-4294952723> ;
266726-        tr-org:hasPrimaryIndustryGroup  <https://permid.org/1-4294952829> ;
266727-        tr-org:isIncorporatedIn         <http://sws.geonames.org/6252001/> ;
266728-        fibo-be-le-cb:isDomiciledIn     <http://sws.geonames.org/6252001/> ;
266729-        vcard:hasURL                    <http://sysorex.com/> ;
266730-        vcard:organization-name         "Sysorex Global"^^xsd:string .
--
35184710:<https://permid.org/1-4296182513>
35184711-        a                               tr-org:Organization ;
35184712-        mdaas:HeadquartersAddress       "2479 E Bayshore Rd Ste 195\nPALO ALTO\nCALIFORNIA\n94303-3245\nUnited States\n"^^xsd:string ;
35184713-        mdaas:RegisteredAddress         "112 North Curry Street\nCARSON CITY\nNEVADA\n89703-4934\nUnited States\n"^^xsd:string ;
35184714-        tr-common:hasPermId             "4296182513"^^xsd:string ;
35184715-        tr-fin:hasOrganizationPrimaryQuote
35184716-                <https://permid.org/1-21539925349> ;
35184717-        tr-fin:hasPrimaryInstrument     <https://permid.org/1-8589997596> ;
35184718-        tr-org:hasActivityStatus        tr-org:statusActive ;
35184719-        tr-org:hasHeadquartersFaxNumber
35184720-                "14088241543"^^xsd:string ;
35184721-        tr-org:hasHeadquartersPhoneNumber
35184722-                "14087022167"^^xsd:string ;
35184723-        tr-org:hasHoldingClassification
35184724-                tr-org:publiclyHeld ;
35184725-        tr-org:hasIPODate               "2014-04-10T04:00:00Z"^^xsd:dateTime ;
35184726-        tr-org:hasLatestOrganizationFoundedDate
35184727-                "1999-04-08T00:00:00Z"^^xsd:dateTime ;
35184728-        tr-org:hasPrimaryBusinessSector
35184729-                <https://permid.org/1-4294952830> ;
35184730-        tr-org:hasPrimaryEconomicSector
35184731-                <https://permid.org/1-4294952723> ;
35184732-        tr-org:hasPrimaryIndustryGroup  <https://permid.org/1-4294952829> ;
35184733-        tr-org:isIncorporatedIn         <http://sws.geonames.org/6252001/> ;
35184734-        fibo-be-le-cb:isDomiciledIn     <http://sws.geonames.org/6252001/> ;
35184735-        vcard:hasURL                    <http://sysorex.com/> ;
35184736-        vcard:organization-name         "Inpixon"^^xsd:string .
--
37577944:<https://permid.org/1-4296182513>
37577945-        a                               tr-org:Organization ;
37577946-        mdaas:HeadquartersAddress       "2479 E Bayshore Rd Ste 195\nPALO ALTO\nCALIFORNIA\n94303-3245\nUnited States\n"^^xsd:string ;
37577947-        mdaas:RegisteredAddress         "112 N Curry St\nCARSON CITY\nNEVADA\n89703-4934\nUnited States\n"^^xsd:string ;
37577948-        tr-common:hasPermId             "4296182513"^^xsd:string ;
37577949-        tr-fin:hasOrganizationPrimaryQuote
37577950-                <https://permid.org/1-21539925349> ;
37577951-        tr-fin:hasPrimaryInstrument     <https://permid.org/1-8589997596> ;
37577952-        tr-org:hasActivityStatus        tr-org:statusActive ;
37577953-        tr-org:hasHeadquartersFaxNumber
37577954-                "14088241543"^^xsd:string ;
37577955-        tr-org:hasHeadquartersPhoneNumber
37577956-                "14087022167"^^xsd:string ;
37577957-        tr-org:hasHoldingClassification
37577958-                tr-org:publiclyHeld ;
37577959-        tr-org:hasIPODate               "2002-05-29T04:00:00Z"^^xsd:dateTime ;
37577960-        tr-org:hasLatestOrganizationFoundedDate
37577961-                "1999-04-08T00:00:00Z"^^xsd:dateTime ;
37577962-        tr-org:hasPrimaryBusinessSector
37577963-                <https://permid.org/1-4294952830> ;
37577964-        tr-org:hasPrimaryEconomicSector
37577965-                <https://permid.org/1-4294952723> ;
37577966-        tr-org:hasPrimaryIndustryGroup  <https://permid.org/1-4294952829> ;
37577967-        tr-org:isIncorporatedIn         <http://sws.geonames.org/6252001/> ;
37577968-        fibo-be-le-cb:isDomiciledIn     <http://sws.geonames.org/6252001/> ;
37577969-        vcard:hasURL                    <https://inpixon.com/> ;
37577970-        vcard:organization-name         "Inpixon"^^xsd:string .
--
permid-api intelligent-tagging-api open-permid-api Download bulk-download entity
icon clock
10 |1500

Up to 2 attachments (including images) can be used with a maximum of 512.0 KiB each and 1.0 MiB total.

Asked the experts, Eran and Tsafi, to help with this question

Sent an email to CLFHelpDesk@thomsonreuters.com, so its triage will be extended 1 week further.

Updated:

From: CLFHelpDesk@thomsonreuters.com

c.c.: Vladimir.Rozhavsky@thomsonreuters.com

Hi Nipat,


We are investigating this issue and will get back with an update soon. 


Thanks and Regards,
CLF HELPDESK

Please see the recent update from the TMSTech Content Support team:

Hi,

The duplicate permID records in
the bulk file is a known issue, currently being handled by our QA team.
We hope the fix will be provided
soon, we will keep you updated. 


Regards,
Matan Gafni
Content Monitoring & BI Analyst
Thomson Reuters
matan.gafni@thomsonreuters.com

I've sent a follow-up email to Matan so please wait for the reply.

Below is the update:

Hi Nipat,

Many of the duplicated permIDs
are now fixed, but the issue is ongoing and new duplicate records might appear.

A more robust solution to this
issue is expected to be implemented next month.

Will keep you posted.


Regards,
Matan Gafni

Content Monitoring & BI Analyst
Thomson Reuters

Contacted CLF HelpDesk to answer this question.

Upvotes
Accepted
78.8k 250 52 74
@amarder

The development team has acknowledged this issue. They will fix this issue but at the moment there is no specific date for the fix.

For duplicated records, you should take the last one with the highest line number.

icon clock
10 |1500

Up to 2 attachments (including images) can be used with a maximum of 512.0 KiB each and 1.0 MiB total.

I found the latest version of the bulk organization file has only one entry for 1-5045849264. Therefore, this issue has been resolved.

Upvotes
78.8k 250 52 74

@amarder

The new version of the Organization file became available on 29 Oct 2017 (OpenPermID-bulk-organization-20171029_070342.ttl). I have verified it and there is no duplicated entry for 1-4296182513.

Could you please use the new file and let us know the result?

icon clock
10 |1500

Up to 2 attachments (including images) can be used with a maximum of 512.0 KiB each and 1.0 MiB total.

Upvotes
1 1 0 1

@jirapongse.phuriphanvichai

Thanks for following up. Looking at the new file, I agree there is a single entry for 1-4296182513. Unfortunately, other PermIDs still have multiple entries. For instance, here are the four entries for 1-5045849264:

433502:<https://permid.org/1-5045849264>
433503-        a                            tr-org:Organization ;
433504-        mdaas:HeadquartersAddress    "Singapore\n"^^xsd:string ;
433505-        tr-common:hasPermId          "5045849264"^^xsd:string ;
433506-        tr-org:hasActivityStatus     tr-org:statusActive ;
433507-        tr-org:hasLEI                "549300DYX0UTSCF6MS89"^^xsd:string ;
433508-        fibo-be-le-cb:isDomiciledIn  <http://sws.geonames.org/1880251/> ;
433509-        vcard:hasURL                 <http://pnd-hardware.com/> ;
433510-        vcard:organization-name      "PND Hardware & Trading Pte Ltd"^^xsd:string .
--
558416:<https://permid.org/1-5045849264>
558417-        a                              tr-org:Organization ;
558418-        mdaas:HeadquartersAddress      "13 Gul Link\n629383\nSingapore\n"^^xsd:string ;
558419-        mdaas:RegisteredAddress        "13 Gul Link\n629383\nSingapore\n"^^xsd:string ;
558420-        tr-common:hasPermId            "5045849264"^^xsd:string ;
558421-        tr-org:hasActivityStatus       tr-org:statusActive ;
558422-        tr-org:hasHeadquartersFaxNumber
558423-                "6565666298"^^xsd:string ;
558424-        tr-org:hasHeadquartersPhoneNumber
558425-                "6565656233"^^xsd:string ;
558426-        tr-org:hasLEI                  "549300DYX0UTSCF6MS89"^^xsd:string ;
558427-        tr-org:hasRegisteredFaxNumber  "6565666298"^^xsd:string ;
558428-        tr-org:hasRegisteredPhoneNumber
558429-                "6565656233"^^xsd:string ;
558430-        tr-org:isIncorporatedIn        <http://sws.geonames.org/1880251/> ;
558431-        fibo-be-le-cb:isDomiciledIn    <http://sws.geonames.org/1880251/> ;
558432-        vcard:hasURL                   <http://pnd-hardware.com/> ;
558433-        vcard:organization-name        "PND Hardware & Trading Pte Ltd"^^xsd:string .
--
27452944:<https://permid.org/1-5045849264>
27452945-        a                              tr-org:Organization ;
27452946-        mdaas:HeadquartersAddress      "13 Gul Link\n629383\nSingapore\n"^^xsd:string ;
27452947-        mdaas:RegisteredAddress        "13 Gul Link\n629383\nSingapore\n"^^xsd:string ;
27452948-        tr-common:hasPermId            "5045849264"^^xsd:string ;
27452949-        tr-org:hasActivityStatus       tr-org:statusActive ;
27452950-        tr-org:hasHeadquartersFaxNumber
27452951-                "6565666298"^^xsd:string ;
27452952-        tr-org:hasHeadquartersPhoneNumber
27452953-                "6565656233"^^xsd:string ;
27452954-        tr-org:hasLEI                  "549300DYX0UTSCF6MS89"^^xsd:string ;
27452955-        tr-org:hasRegisteredFaxNumber  "6565666298"^^xsd:string ;
27452956-        tr-org:hasRegisteredPhoneNumber
27452957-                "6565656233"^^xsd:string ;
27452958-        tr-org:isIncorporatedIn        <http://sws.geonames.org/1880251/> ;
27452959-        fibo-be-le-cb:isDomiciledIn    <http://sws.geonames.org/1880251/> ;
27452960-        vcard:hasURL                   <http://pnd-hardware.com/> ;
27452961-        vcard:organization-name        "PND Hardware & Trading Pte Ltd"^^xsd:string .
--
38847298:<https://permid.org/1-5045849264>
38847299-        a                              tr-org:Organization ;
38847300-        mdaas:HeadquartersAddress      "13 Gul Link\n629383\nSingapore\n"^^xsd:string ;
38847301-        mdaas:RegisteredAddress        "13 Gul Link\n629383\nSingapore\n"^^xsd:string ;
38847302-        tr-common:hasPermId            "5045849264"^^xsd:string ;
38847303-        tr-org:hasActivityStatus       tr-org:statusActive ;
38847304-        tr-org:hasHeadquartersFaxNumber
38847305-                "6565666298"^^xsd:string ;
38847306-        tr-org:hasHeadquartersPhoneNumber
38847307-                "6565656233"^^xsd:string ;
38847308-        tr-org:hasLEI                  "549300DYX0UTSCF6MS89"^^xsd:string ;
38847309-        tr-org:hasRegisteredFaxNumber  "6565666298"^^xsd:string ;
38847310-        tr-org:hasRegisteredPhoneNumber
38847311-                "6565656233"^^xsd:string ;
38847312-        tr-org:isIncorporatedIn        <http://sws.geonames.org/1880251/> ;
38847313-        fibo-be-le-cb:isDomiciledIn    <http://sws.geonames.org/1880251/> ;
38847314-        vcard:hasURL                   <http://pnd-hardware.com/> ;
38847315-        vcard:organization-name        "PND Hardware & Trading Pte Ltd"^^xsd:string .

icon clock
10 |1500

Up to 2 attachments (including images) can be used with a maximum of 512.0 KiB each and 1.0 MiB total.

@amarder

Thank you so much for the information.

I will contact the support team to verify it.

Write an Answer

Hint: Notify or tag a user in this post by typing @username.

Up to 2 attachments (including images) can be used with a maximum of 512.0 KiB each and 1.0 MiB total.