Index: fmts/trunk/p/C0XF2N.m
===================================================================
--- fmts/trunk/p/C0XF2N.m	(revision 1281)
+++ fmts/trunk/p/C0XF2N.m	(revision 1294)
@@ -1,4 +1,4 @@
-C0XMAIN ; GPL - Fileman Triples entry point routine ;10/13/11  17:05
- ;;0.1;C0X;nopatch;noreleasedate;Build 1
+C0XF2N ; GPL - Fileman Triples entry point routine ;10/13/11  17:05
+ ;;0.1;C0X;nopatch;noreleasedate;Build 5
  ;Copyright 2011 George Lilly.  Licensed under the terms of the GNU
  ;General Public License See attached copy of the License.
@@ -33,9 +33,10 @@
  ; FOR THE DEFAULT TRIPLE STORE. USE OTHER VALUES FOR SUPPORTING ADDITIONAL
  ; TRIPLE STORES
+ I $D(@ZFARY) Q  ; ALREADY INITIALIZED
  S @ZFARY@("C0XTFN")=172.101 ; TRIPLES FILE NUMBER
  S @ZFARY@("C0XSFN")=172.201 ; TRIPLES STRINGS FILE NUMBER
  S @ZFARY@("C0XTN")=$NA(^C0X(101)) ; TRIPLES GLOBAL NAME
  S @ZFARY@("C0XSN")=$NA(^C0X(201)) ; STRING FILE GLOBAL NAME
- S @ZFARY@("C0XDIR")="/home/glilly/fmts/trunk/samples/qds/"
+ S @ZFARY@("C0XDIR")="/home/glilly/fmts/trunk/samples/"
  S @ZFARY@("BLKLOAD")=1 ; this file supports block load
  S @ZFARY@("FMTSSTYLE")="F2N" ; fileman style
@@ -71,11 +72,12 @@
  S C0XFN=Y
  D IMPORT(C0XFN,C0XDIR,,"C0XFARY")
- Q
- ;
-IMPORT(FNAME,FDIR,FURL,FARY) ; EXTRINSIC THAT READS A FILE FROM THE STANDARD 
+ K C0XFDA
+ Q
+ ;
+IMPORT(FNAME,INDIR,INURL,FARY) ; EXTRINSIC THAT READS A FILE FROM THE STANDARD 
  ; DIRECTORY, LOADS IT INTO THE TRIPLESTORE AS TEXT, AND RETURNS THE
  ; NODE NAME OF THE TEXT TRIPLE
- ; FDIR IS THE OPTIONAL DIRECTORY (DEFAUTS TO STANDARD DIR)
- ; FURL IS THE OPTIONAL URI FOR ACCESSING THE FILE FROM THE TRIPLE STORE
+ ; INDIR IS THE OPTIONAL DIRECTORY (DEFAULTS TO STANDARD DIR)
+ ; INURL IS THE OPTIONAL URI FOR ACCESSING THE FILE FROM THE TRIPLE STORE
  ; FARY IS THE OPTIONAL FILE ARRAY OF THE TRIPLE STORE TO USE
  I '$D(FARY) D  ;
@@ -84,8 +86,9 @@
  D USEFARY(FARY)
  N ZD,ZTMP
- I '$D(FDIR) S FDIR=C0XDIR ; DIRECTORY OF THE RDF FILE
- I '$D(FURL) D  ;
- . N ZN2 S ZN2=$TR(FNAME,".","_") ; REMOVE THE DOT FROM THE NAME
- . S FURL=FDIR_ZN2
+ I '$D(INDIR) S INDIR=C0XDIR ; DIRECTORY OF THE RDF FILE
+ I $G(INURL)="" D  ;
+ . ;N ZN2 S ZN2=$P(FNAME,".",1)_"_"_$P(FNAME,".",2) ; REMOVE THE DOT 
+ . ;S INURL=FDIR_ZN2
+ . S INURL=INDIR_FNAME
  N ZTMP
  S ZTMP=$NA(^TMP("C0X",$J,"FILEIN",1)) ; WHERE TO PUT THE INCOMING FILE
@@ -94,9 +97,12 @@
  W !,"STARTED: ",C0XSTART
  W !,"READING IN: ",FNAME
- I '$$FILEREAD(ZTMP,FDIR,FNAME,4) D  Q  ; QUIT IF NO SUCCESS
- . W !,"ERROR READING FILE: ",FDIR,FNAME 
+ I '$$FILEREAD(ZTMP,INDIR,FNAME,4) D  Q  ; QUIT IF NO SUCCESS
+ . W !,"ERROR READING FILE: ",INDIR,FNAME 
  S ZRDF=$NA(^TMP("C0X",$J,"FILEIN")) ; WITHOUT THE SUBSCRIPT
  W !,$O(@ZRDF@(""),-1)," LINES READ"
- D INSRDF(ZRDF,FURL,FARY) ; IMPORT AND PROCESS THE RDF
+ D INSRDF(ZRDF,INURL,FARY) ; IMPORT AND PROCESS THE RDF
+ K INURL
+ K C0XFDA
+ K ^TMP("MXMLDOM",$J)
  Q
  ;
@@ -132,4 +138,6 @@
  . S FARY="C0XFARY"
  D USEFARY(FARY)
+ S BATCNT=0 ; BATCH COUNTER
+ S BATMAX=10000 ; TRY BATCHES OF THIS SIZE
  N ZGRAPH,ZSUBJECT
  S ZGRAPH="_:G"_$$LKY9 ; RANDOM GRAPH NAME
@@ -139,9 +147,9 @@
  S ZTXTNM="_TXT_INCOMING_RDF_FILE_"_ZNAME_"_"_$$LKY9 ; NAME FOR TEXT NODE
  D ADD(ZGRAPH,ZSUBJECT,"fmts:rdfSource",ZTXTNM,FARY)
- D UPDIE(.C0XFDA) ; TRY IT OUT
+ D SWUPDIE(.C0XFDA) ; TRY IT OUT
  K C0XCNT ;RESET FOR NEXT TIME
  D STORETXT(ZRDF,ZTXTNM,FARY)
  W !,"ADDED: ",ZGRAPH," ",ZSUBJECT," fmts:rdfSource ",ZTXTNM
- D PROCESS2(.G,ZRDF,ZNAME,ZGRAPH,FARY) ; PARSE AND INSERT THE RDF
+ D PROCESS(.G,ZRDF,ZNAME,ZGRAPH,FARY) ; PARSE AND INSERT THE RDF
  Q
  ;
@@ -207,10 +215,21 @@
  . S FARY="C0XFARY"
  D USEFARY(FARY)
+ ;N BATCNT
+ ;N BATMAX
  ; -- first parse the rdf file with the MXML parser
  ;S C0XDOCID=$$PARSE^C0CNHIN(ZRDF,"C0XARRAY") ; PARSE WITH MXML
+ S C0XDLC2=$$NOW^XLFDT ; START OF PARSE
  S C0XDOCID=$$EN^MXMLDOM(ZRDF,"W")
+ K @ZRDF ; DON'T NEED INPUT BUFFER ANYMORE
  ; -- assign the MXLM dom global name to ZDOM
  S ZDOM=$NA(^TMP("MXMLDOM",$J,C0XDOCID))
- W !,$O(@ZDOM@(""),-1)," XML NODES PARSED"
+ S C0XNODE=$O(@ZDOM@(""),-1)
+ W !,C0XNODE," XML NODES PARSED"
+ S C0XPRS=$$NOW^XLFDT ; PARSE COMPLETE
+ W !,"PARSE COMPLETE AT ",C0XPRS
+ S C0XDIFF=$$FMDIFF^XLFDT(C0XPRS,C0XDLC2,2)
+ W !," ELAPSED TIME: ",C0XDIFF," SECONDS"
+ I C0XDIFF'=0 D  ;
+ . W !," APPROXIMATELY ",$P(C0XNODE/C0XDIFF,".")," NODES PER SECOND"
  ; -- populate the metagraph to point to the graph with status unfinished
  S METAS=$$ANONS ; GET AN ANONOMOUS RANDOM SUBJECT
@@ -218,8 +237,9 @@
  D ADD(ZMETA,METAS,"fmts:about",ZGRF,FARY) ; POINT THE META TO THE GRAPH
  D ADD(ZMETA,METAS,"fmts:status","unfinished",FARY) ; mark as unfinished
+ W !,"INSERTING GRAPH: ",ZGRF
  ;S C0XDATE=$$FMDTOUTC^C0CUTIL($$NOW^XLFDT,"DT")
  S C0XDATE=$$NOW^XLFDT
  D ADD(ZMETA,METAS,"fmts:dateTime",C0XDATE,FARY)
- D UPDIE(.C0XFDA) ; commit the metagraph changes to the triple store
+ D SWUPDIE(.C0XFDA) ; commit the metagraph changes to the triple store
  ; -- 
  ; -- pull out the vocabularies in the RDF statement. marked with xmlns:
@@ -288,118 +308,4 @@
  . . . W !,"ERROR, NO OBJECT FOUND FOR NODE: ",ZJ
  . . D ADD(ZGRF,C0XSUB,C0XPRE,C0XOBJ) ; go for it and add a node
- W !,"INSERTING ",C0XCNT," TRIPLES"
- D UPDIE(.C0XFDA) ; commit the updates to the file
- ; next, mark the graph as finished
- S C0XEND=$$NOW^XLFDT
- W !," ENDED AT: ",C0XEND
- S C0XDIFF=$$FMDIFF^XLFDT(C0XEND,C0XSTART,2)
- W !," ELAPSED TIME: ",C0XDIFF," SECONDS"
- I C0XDIFF'=0 D  ;
- . W !," APPROXIMATELY ",$P(C0XCNT/C0XDIFF,".")," TRIPLES PER SECOND"
- Q
- ;
-PROCESS2(ZRTN,ZRDF,ZGRF,ZMETA,FARY) ; PROCESS AN INCOMING RDF FILE
- ; ZRTN IS PASS BY REFERENCE AND RETURNS MESSAGES ABOUT THE PROCESSING
- ; ZRDF IS PASSED BY NAME AND IS THE GLOBAL CONTAINING THE RDF FILE
- ; ZGRF IS THE NAME OF THE GRAPH TO USE IN THE TRIPLE STORE FOR RESULTS
- ; ZMETA IS OPTIONAL AND IS THE NAME OF THE GRAPH TO STORE METADATA
- ;
- I '$D(FARY) D  ;
- . D INITFARY("C0XFARY")
- . S FARY="C0XFARY"
- D USEFARY(FARY)
- ;N BATCNT
- ;N BATMAX
- S BATCNT=0 ; BATCH COUNTER
- S BATMAX=10000 ; TRY BATCHES OF THIS SIZE
- ; -- first parse the rdf file with the MXML parser
- ;S C0XDOCID=$$PARSE^C0CNHIN(ZRDF,"C0XARRAY") ; PARSE WITH MXML
- S C0XDLC2=$$NOW^XLFDT ; START OF PARSE
- S C0XDOCID=$$EN^MXMLDOM(ZRDF,"W")
- ; -- assign the MXLM dom global name to ZDOM
- S ZDOM=$NA(^TMP("MXMLDOM",$J,C0XDOCID))
- S C0XNODE=$O(@ZDOM@(""),-1)
- W !,C0XNODE," XML NODES PARSED"
- S C0XPRS=$$NOW^XLFDT ; PARSE COMPLETE
- W !,"PARSE COMPLETE AT ",C0XPRS
- S C0XDIFF=$$FMDIFF^XLFDT(C0XPRS,C0XDLC2,2)
- W !," ELAPSED TIME: ",C0XDIFF," SECONDS"
- I C0XDIFF'=0 D  ;
- . W !," APPROXIMATELY ",$P(C0XNODE/C0XDIFF,".")," NODES PER SECOND"
- ; -- populate the metagraph to point to the graph with status unfinished
- S METAS=$$ANONS ; GET AN ANONOMOUS RANDOM SUBJECT
- I '$D(ZMETA) S ZMETA="_:G"_$$LKY9 ; RANDOM GRAPH NAME FOR METAGRAPH
- D ADD(ZMETA,METAS,"fmts:about",ZGRF,FARY) ; POINT THE META TO THE GRAPH
- D ADD(ZMETA,METAS,"fmts:status","unfinished",FARY) ; mark as unfinished
- ;S C0XDATE=$$FMDTOUTC^C0CUTIL($$NOW^XLFDT,"DT")
- S C0XDATE=$$NOW^XLFDT
- D ADD(ZMETA,METAS,"fmts:dateTime",C0XDATE,FARY)
- D UPDIE(.C0XFDA) ; commit the metagraph changes to the triple store
- ; -- 
- ; -- pull out the vocabularies in the RDF statement. marked with xmlns:
- ; -- put them in a local variable for quick reference
- ; -- TODO: create a graph for vocabularies and validate incoming against it
- ;
- S C0XVOC=""
- N ZI,ZJ,ZK S ZI=""
- F  S ZI=$O(@ZDOM@(1,"A",ZI)) Q:ZI=""  D  ; FOR EACH xmlns
- . S ZVOC=$P(ZI,"xmlns:",2)
- . I ZVOC'="" S C0XVOC(ZVOC)=$G(@ZDOM@(1,"A",ZI))
- ;W !,"VOCABS:" ZWR C0XVOC
- ;
- ; -- look for children called rdf:Description. quit if none. not an rdf file
- ;
- S ZI=$O(@ZDOM@(1,"C",""))
- I $G(@ZDOM@(1,"C",ZI))'="rdf:Description" D  Q  ; not an rdf file
- . W !,"Error. Not an RDF file. Cannot process."
- ;
- ; -- now process the rdf description children
- ;
- S ZI=""
- S (C0XSUB,C0XPRE,C0XOBJ)="" ; INITIALIZE subject, object and predicate
- F  S ZI=$O(@ZDOM@(1,"C",ZI)) Q:ZI=""  D  ;
- . ; -- we are skipping any child that is not rdf:Description
- . ; -- TODO: check to see if this is right in general
- . ;
- . IF $G(@ZDOM@(1,"C",ZI))'="rdf:Description" D  Q  ;
- . . W !,"SKIPPING NODE: ",ZI
- . ; -- now looking for the subject for the triples
- . S ZX=$G(@ZDOM@(ZI,"A","rdf:about"))
- . I ZX'="" D  ; we have the subject
- . . ;W " about: ",ZX
- . . S C0XSUB=ZX
- . E  D  ;
- . . S ZX=$G(@ZDOM@(ZI,"A","rdf:nodeID")) ; node id is another style of subject
- . . I ZX'="" D  ;
- . . . S C0XSUB=ZX
- . I C0XSUB="" S C0XSUB=$$ANONS ; DEFAULT TO BLANK SUBJECT
- . ; 
- . ; -- we now have the subject. the children of this node have the rest
- . ;
- . S ZJ="" ; for the children of the rdf:Description nodes
- . F  S ZJ=$O(@ZDOM@(ZI,"C",ZJ)) Q:ZJ=""  D  ; for each child
- . . S C0XPRE=@ZDOM@(ZJ) ; the predicate without a prefix
- . . S ZX=$G(@ZDOM@(ZJ,"A","xmlns")) ; name space
- . . I ZX'="" S C0XPRE=ZX_C0XPRE ; add the namespace prefix
- . . I C0XPRE[":" D  ; expand using vocabulary
- . . . N ZB,ZA
- . . . S ZB=$P(C0XPRE,":",1)
- . . . S ZA=$P(C0XPRE,":",2)
- . . . I $G(C0XVOC(ZB))'="" D  ;
- . . . . S C0XPRE=C0XVOC(ZB)_ZA ; expanded 
- . . S ZY=$G(@ZDOM@(ZJ,"A","rdf:resource")) ; potential object
- . . I ZY'="" D  Q ; 
- . . . S C0XOBJ=ZY ; object
- . . . D ADD2(ZGRF,C0XSUB,C0XPRE,C0XOBJ) ; finally. our first real triple
- . . ; -- this is an else because of the quit above
- . . S ZX=$G(@ZDOM@(ZJ,"A","rdf:nodeID")) ; fishing for nodeId object
- . . I ZX'="" D  Q  ; got one
- . . . S C0XOBJ=ZX ; we are using the incoming nodeIDs as object/subject 
- . . . ; without change... this could be foolish .. look at it again later
- . . . D ADD2(ZGRF,C0XSUB,C0XPRE,C0XOBJ) ; go for it and add a node
- . . S C0XOBJ=$G(@ZDOM@(ZJ,"T",1)) ; hopefully an object is here
- . . I C0XOBJ="" D  Q  ; not a happy situation
- . . . W !,"ERROR, NO OBJECT FOUND FOR NODE: ",ZJ
- . . D ADD2(ZGRF,C0XSUB,C0XPRE,C0XOBJ) ; go for it and add a node
  S C0XTRP=$$NOW^XLFDT ; PARSE COMPLETE
  W !,"TRIPLES COMPLETE AT ",C0XTRP
@@ -419,10 +325,10 @@
  S C0XDIFF=$$FMDIFF^XLFDT(C0XINS,C0XTRP,2)
  W !," ELAPSED TIME: ",C0XDIFF," SECONDS"
- W !," APPROXIMATELY ",$P(C0XCNT/C0XDIFF,".")," NODES PER SECOND"
+ I C0XDIFF'=0 W !," APPROXIMATELY ",$P(C0XCNT/C0XDIFF,".")," NODES PER SECOND"
  S C0XEND=$$NOW^XLFDT
  W !," ENDED AT: ",C0XEND
  S C0XDIFF=$$FMDIFF^XLFDT(C0XEND,C0XSTART,2)
  W !," ELAPSED TIME: ",C0XDIFF," SECONDS"
- W !," APPROXIMATELY ",$P(C0XCNT/C0XDIFF,".")," TRIPLES PER SECOND"
+ I C0XDIFF'=0 W !," APPROXIMATELY ",$P(C0XCNT/C0XDIFF,".")," TRIPLES PER SECOND"
  Q
  ;
@@ -432,5 +338,5 @@
  ;
 ANONS() ; RETURNS AN ANONOMOUS SUBJECT
- Q "_S:"_$$LKY9
+ Q "_:S"_$$LKY9
  ;
 NEWG(NGRAPH,NMETA) ; CREATES A NEW META GRAPH, MARKS IT AS UNFINISHED
@@ -442,33 +348,4 @@
  ;
 ADD(ZG,ZS,ZP,ZO,FARY) ; ADD A TRIPLE TO THE TRIPLESTORE. ALL VALUES ARE TEXT
- ; THE FDA IS SET UP BUT THE FILES ARE NOT UPDATED. CALL UPDIE TO COMPLETE
- I '$D(FARY) D  ;
- . D INITFARY("C0XFARY")
- . S FARY="C0XFARY"
- D USEFARY(FARY)
- I '$D(C0XCNT) S C0XCNT=0
- N ZNODE
- S ZNODE="N"_$$LKY17
- N ZNARY ; GET READY TO CALL IENOFA
- S ZNARY("ZG",ZG)=""
- S ZNARY("ZS",ZS)=""
- S ZNARY("ZP",ZP)=""
- S ZNARY("ZO",ZO)=""
- D IENOFA(.ZIENS,.ZNARY,FARY) ; RESOLVE/ADD STRINGS
- ;S ZGIEN=$$IENOF(ZG) ; LAYGO TO GET IEN
- ;S ZSIEN=$$IENOF(ZS)
- ;S ZPIEN=$$IENOF(ZP)
- ;S ZOIEN=$$IENOF(ZO)
- ;I $D(C0XFDA) D UPDIE ; ADD THE STRINGS IF NEEDED
- S C0XCNT=C0XCNT+1
- S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.01)=ZNODE
- S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.02)=$O(ZIENS("IEN","ZG",""))
- S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.03)=$O(ZIENS("IEN","ZS",""))
- S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.04)=$O(ZIENS("IEN","ZP",""))
- S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.05)=$O(ZIENS("IEN","ZO",""))
- ; REMEMBER TO CALL UPDIE WHEN YOU'RE DONE
- Q
- ;
-ADD2(ZG,ZS,ZP,ZO,FARY) ; ADD A TRIPLE TO THE TRIPLESTORE. ALL VALUES ARE TEXT
  ; THE FDA IS SET UP BUT THE FILES ARE NOT UPDATED. CALL UPDIE TO COMPLETE
  I '$D(FARY) D  ;
@@ -637,4 +514,12 @@
  Q
  ;
+SWUPDIE(ZFDA) ; FILE THE FDA IN ZFDA (PASSED BY REFERENCE) VIA BULKLOAD OR UPDIE
+ I $G(BLKLOAD) D  ; BLKLOAD is true: use the bulk loader
+ . D BULKLOAD(.ZFDA) ; bulk load the batch
+ E  D  ; BLKLOAD is false or undefined: no bulk load
+ . D UPDIE(.ZFDA)
+ K ZFDA ; ZFDA is by reference, so this empties the caller's FDA for the next batch
+ Q
+ ; 
 UPDIE(ZFDA) ; INTERNAL ROUTINE TO CALL UPDATE^DIE AND CHECK FOR ERRORS
  ; ZFDA IS PASSED BY REFERENCE
Index: fmts/trunk/p/C0XINIT.m
===================================================================
--- fmts/trunk/p/C0XINIT.m	(revision 1294)
+++ fmts/trunk/p/C0XINIT.m	(revision 1294)
@@ -0,0 +1,116 @@
+C0XINIT ; GPL - Fileman Triples initialization routine ;10/13/11  17:05
+ ;;0.1;C0X;nopatch;noreleasedate;Build 5
+ ;Copyright 2011 George Lilly.  Licensed under the terms of the GNU
+ ;General Public License See attached copy of the License.
+ ;
+ ;This program is free software; you can redistribute it and/or modify
+ ;it under the terms of the GNU General Public License as published by
+ ;the Free Software Foundation; either version 2 of the License, or
+ ;(at your option) any later version.
+ ;
+ ;This program is distributed in the hope that it will be useful,
+ ;but WITHOUT ANY WARRANTY; without even the implied warranty of
+ ;MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ ;GNU General Public License for more details.
+ ;
+ ;You should have received a copy of the GNU General Public License along
+ ;with this program; if not, write to the Free Software Foundation, Inc.,
+ ;51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
+ ;
+ Q
+ ;
+CLEAR ; DELETE THE TRIPLE STORE: KILL ^C0X AND RE-SET THE ZERO NODES OF 101 AND 201
+ K ^C0X ; removes everything stored under ^C0X
+ S ^C0X(101,0)="C0X TRIPLE^172.101I^^" ; zero node for the triples file (172.101)
+ S ^C0X(201,0)="C0X STRING^172.201I^^" ; zero node for the strings file (172.201)
+ Q
+ ;
+INIT ; INITIALIZE THE TRIPLE STORE - THIS DELETES THE GLOBALS AND
+ ; STARTS ALL OVER BY RE-IMPORTING THE SAMPLE RDF FILES... USE WITH CAUTION
+ ;
+ ; -- TODO: we should be more sophisticated here: at least warn the user
+ ; -- and give them a chance to cancel
+ ;
+ D CLEAR ; DELETE THE TRIPLESTORE
+ ;
+ ; -- we are assuming that FARY is set up properly in C0XF2N
+ ; -- with respect to the default directory and the default fileman files
+ ; -- here's what it is now: "/home/glilly/fmts/trunk/samples/"
+ ; -- that means that all the sample files will look like:
+ ; --- qds/QDS_0001.rdf
+ ; --- smart-rdf-in/small.rdf
+ ;
+ S FARY="C0XFARY"
+ D INITFARY^C0XF2N(FARY)
+ D USEFARY^C0XF2N(FARY)
+ S C0XFARY("C0XDIR")="/home/glilly/fmts/trunk/samples/smart-rdf-in/" ; directory of the SMART sample files
+ D USEFARY^C0XF2N(FARY) ; presumably refreshes C0XDIR from the array - confirm against USEFARY
+ S SMART(1)="cole-susan.rdf"
+ S SMART(2)="jones-cynthia.rdf"
+ S SMART(3)="small.rdf"
+ S SMART(4)="collins-frank.rdf"
+ S SMART(5)="kelly-david.rdf"
+ S SMART(6)="smith-maria.rdf"
+ S SMART(7)="ford-shirley.rdf"
+ S SMART(8)="morgan-jason.rdf"
+ S SMART(9)="west-lisa.rdf"
+ S SMART(10)="gracia-paul.rdf"
+ S SMART(11)="reed-richard.rdf"
+ S SMART(12)="west-sandra.rdf"
+ S SMART(13)="jackson-jessica.rdf"
+ S SMART(14)="small-allergies.rdf"
+ S SMART(15)="white-patricia.rdf"
+ N ZI S ZI=""
+ F  S ZI=$O(SMART(ZI)) Q:ZI=""  D  ; for each smart file, in subscript order
+ . D IMPORT^C0XF2N(SMART(ZI),C0XDIR,,FARY) ; import to the triplestore; third argument (INURL) is omitted
+ S FARY="C0XFARY"
+ S C0XFARY("C0XDIR")="/home/glilly/fmts/trunk/samples/qds/" ; directory of the QDS sample files
+ D USEFARY^C0XF2N(FARY) ; presumably refreshes C0XDIR from the array - confirm against USEFARY
+ D IMPORT^C0XF2N("QDS_0001.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0028b.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0052.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0073.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0385.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0002.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0031.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0055.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0074.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0387.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0004.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0032.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0056.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0075.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0389.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0012.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0033.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0059.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0081.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0421.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0013.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0034.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0061.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0083.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0575.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0014.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0036.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0062.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0084.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0018.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0038.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0064.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0086.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0024.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0041.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0067.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0088.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0027.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0043.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0068.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0089.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0028a.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0047.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0070.rdf",C0XDIR,,FARY)
+ D IMPORT^C0XF2N("QDS_0105.rdf",C0XDIR,,FARY)
+ ;D IMPORT^C0XF2N("qds.rdf",C0XDIR,,FARY)
+ Q
+ ;
Index: fmts/trunk/p/C0XMAIN.m
===================================================================
--- fmts/trunk/p/C0XMAIN.m	(revision 1281)
+++ fmts/trunk/p/C0XMAIN.m	(revision 1294)
@@ -1,516 +1,377 @@
-C0XMAIN ; GPL - Fileman Triples entry point routine ;10/13/11  17:05
- ;;0.1;C0X;nopatch;noreleasedate;Build 1
- ;Copyright 2011 George Lilly.  Licensed under the terms of the GNU
- ;General Public License See attached copy of the License.
- ;
- ;This program is free software; you can redistribute it and/or modify
- ;it under the terms of the GNU General Public License as published by
- ;the Free Software Foundation; either version 2 of the License, or
- ;(at your option) any later version.
- ;
- ;This program is distributed in the hope that it will be useful,
- ;but WITHOUT ANY WARRANTY; without even the implied warranty of
- ;MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
- ;GNU General Public License for more details.
- ;
- ;You should have received a copy of the GNU General Public License along
- ;with this program; if not, write to the Free Software Foundation, Inc.,
- ;51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
- ;
- Q
- ;
-INITFARY(ZFARY) ; INITIALIZE FILE NUMBERS AND OTHER USEFUL THINGS
- ; FOR THE DEFAULT TRIPLE STORE. USE OTHER VALUES FOR SUPPORTING ADDITIONAL
- ; TRIPLE STORES
- S @ZFARY@("C0XTFN")=172.101 ; TRIPLES FILE NUMBER
- S @ZFARY@("C0XSFN")=172.201 ; TRIPLES STRINGS FILE NUMBER
- S @ZFARY@("C0XTN")=$NA(^C0X(101)) ; TRIPLES GLOBAL NAME
- S @ZFARY@("C0XSN")=$NA(^C0X(201)) ; STRING FILE GLOBAL NAME
- S @ZFARY@("C0XDIR")="/home/glilly/all_smart_patient_data/smart-rdf/"
- D USEFARY(ZFARY)
- Q
- ;
-USEFARY(ZFARY) ; INITIALIZES VARIABLES SAVED IN ARRAY ZFARY
- N ZI S ZI=""
- F  S ZI=$O(@ZFARY@(ZI)) Q:ZI=""  D  
- . ;N ZX
- . S ZX="S "_ZI_"="""_@ZFARY@(ZI)_""""
- . ;W !,ZX
- . X ZX
- Q
- ;
-IMPORT(FNAME,FDIR,FURL,FARY) ; EXTRINSIC THAT READS A FILE FROM THE STANDARD 
- ; DIRECTORY, LOADS IT INTO THE TRIPLESTORE AS TEXT, AND RETURNS THE
- ; NODE NAME OF THE TEXT TRIPLE
- ; FDIR IS THE OPTIONAL DIRECTORY (DEFAUTS TO STANDARD DIR)
- ; FURL IS THE OPTIONAL URI FOR ACCESSING THE FILE FROM THE TRIPLE STORE
- ; FARY IS THE OPTIONAL FILE ARRAY OF THE TRIPLE STORE TO USE
- I '$D(FARY) D  ;
- . D INITFARY("C0XFARY")
- . S FARY="C0XFARY"
- D USEFARY(FARY)
- N ZD,ZTMP
- I '$D(FDIR) S FDIR=C0XDIR ; DIRECTORY OF THE RDF FILE
- I '$D(FURL) D  ;
- . N ZN2 S ZN2=$TR(FNAME,".","_") ; REMOVE THE DOT FROM THE NAME
- . S FURL=FDIR_ZN2
- N ZTMP
- S ZTMP=$NA(^TMP("C0X",$J,"FILEIN",1)) ; WHERE TO PUT THE INCOMING FILE
- K @ZTMP ; MAKE SURE IT'S CLEAR
- S C0XSTART=$$NOW^XLFDT
- W !,"STARTED: ",C0XSTART
- W !,"READING IN: ",FNAME
- I '$$FILEIN(ZTMP,FDIR,FNAME,4) D  Q  ; QUIT IF NO SUCCESS
- . W !,"ERROR READING FILE: ",FDIR,FNAME 
- S ZRDF=$NA(^TMP("C0X",$J,"FILEIN")) ; WITHOUT THE SUBSCRIPT
- W !,$O(@ZRDF@(""),-1)," LINES READ"
- D INSRDF(ZRDF,FURL,FARY) ; IMPORT AND PROCESS THE RDF
- Q
- ;
-WGET(ZURL,FARY) ; GET FROM THE INTERNET AN RDF FILE AND INSERT IT
- ;
- I '$D(FARY) D  ;
- . D INITFARY("C0XFARY")
- . S FARY="C0XFARY"
- D USEFARY(FARY)
- ;N ZLOC,ZTMP
- K ZTMP
- S ZLOC=$NA(^TMP("C0X","WGET",$J))
- K @ZLOC
- S C0XSTART=$$NOW^XLFDT
- W !,"STARTED: ",C0XSTART
- W !,"DOWNLOADING: ",ZURL
- S OK=$$httpGET^%zewdGTM(ZURL,.ZTMP)
- M @ZLOC=ZTMP
- W !,$O(@ZLOC@(""),-1)," LINES READ"
- D INSRDF(ZLOC,ZURL,FARY)
- Q
- ;
-INSRDF(ZRDF,ZNAME,FARY) ; INSERT AN RDF FILE INTO THE STORE AND PROCESS
- ; ZRDF IS PASSED BY NAME
- I '$D(FARY) D  ;
- . D INITFARY("C0XFARY")
- . S FARY="C0XFARY"
- D USEFARY(FARY)
- N ZGRAPH,ZSUBJECT
- S ZGRAPH="_:G"_$$LKY9 ; RANDOM GRAPH NAME
- S ZSUBJECT=$$ANONS ; RANDOM ANOYMOUS SUBJECT
- D ADD(ZGRAPH,ZSUBJECT,"fmts:url",ZNAME,FARY)
- N ZTXTNM
- S ZTXTNM="_TXT_INCOMING_RDF_FILE_"_ZNAME_"_"_$$LKY9 ; NAME FOR TEXT NODE
- D ADD(ZGRAPH,ZSUBJECT,"fmts:rdfSource",ZTXTNM,FARY)
- D UPDIE(.C0XFDA) ; TRY IT OUT
- K C0XCNT ;RESET FOR NEXT TIME
- D STORETXT(ZRDF,ZTXTNM,FARY)
- W !,"ADDED: ",ZGRAPH," ",ZSUBJECT," fmts:rdfSource ",ZTXTNM
- D PROCESS2(.G,ZRDF,ZNAME,ZGRAPH,FARY) ; PARSE AND INSERT THE RDF
- Q
- ;
-STORETXT(ZTXT,ZNAME,FARY) ; STORE TEXT IN THE TRIPLESTORE AT ZNAME
- ;
- I '$D(FARY) D  ;
- . D INITFARY("C0XFARY")
- . S FARY="C0XFARY"
- D USEFARY(FARY)
- N ZIEN
- S ZIEN=$$IENOF(ZNAME,FARY) ; GET THE IEN
- D CLEAN^DILF
- K ZERR
- D WP^DIE(C0XSFN,ZIEN_",",1,,ZTXT,"ZERR")
- I $D(ZERR) D  ;
- . ZWR ZERR
- Q
- ; 
-GETTXT(ZRTN,ZNAME,FARY) ; RETURNS RDF SOURCE OR OTHER TEXT
- ; ZRTN IS PASSED BY REFERENCE
- I '$D(FARY) D  ;
- . D INITFARY("C0XFARY")
- . S FARY="C0XFARY"
- D USEFARY(FARY)
- N ZIEN
- S ZIEN=$$IENOF(ZNAME)
- S OK=$$GET1^DIQ(C0XSFN,ZIEN_",",1,,"ZRTN")
- Q
- ;
-WHERETXT(ZNAME,FARY) ; EXTRINSIC WHICH RETURNS THE NAME OF THE GLOBAL
- ; WHERE THE TEXT IS LOCATED. NAME IS THE NAME OF THE STRING
- I '$D(FARY) D  ;
- . D INITFARY("C0XFARY")
- . S FARY="C0XFARY"
- D USEFARY(FARY)
- N ZIEN
- S ZIEN=$$IENOF(ZNAME)
- Q $NA(@C0XSN@(ZIEN,1))
- ;
-FILEIN(ZINTMP,ZDIR,ZFNAME,ZLVL) ; READS A FILE INTO ZINTMP USING FTG^%ZISH
- ; ZINTMP IS PASSED BY NAME AND INCLUDES THE NEW SUBSCRIPT
- ; IE ^TMP("C0X","FILEIN",1)
- ; ZLVL IN THIS CASE WOULD BE 3 INCREMENTING THE 1
- ; EXTRINSIC WHICH RETURNS THE RESULT OF FTG^%ZISH
- S OK=$$FTG^%ZISH(ZDIR,FNAME,ZINTMP,ZLVL)
- Q OK
- ;
-TESTPROC ; TEST PROCESS WITH EXISTING SMALL RDF FILE
- S ZIN=$NA(^TMP("C0X",12226,"FILEIN"))
- S ZGRAPH="/test/rdfFile"
- S ZM="/test/rdfFile/meta"
- D PROCESS(.G,ZIN,ZGRAPH,ZM)
- Q
- ;
-PROCESS(ZRTN,ZRDF,ZGRF,ZMETA,FARY) ; PROCESS AN INCOMING RDF FILE
- ; ZRTN IS PASS BY REFERENCE AND RETURNS MESSAGES ABOUT THE PROCESSING
- ; ZRDF IS PASSED BY NAME AND IS THE GLOBAL CONTAINING THE RDF FILE
- ; ZGRF IS THE NAME OF THE GRAPH TO USE IN THE TRIPLE STORE FOR RESULTS
- ; ZMETA IS OPTIONAL AND IS THE NAME OF THE GRAPH TO STORE METADATA
- ;
- I '$D(FARY) D  ;
- . D INITFARY("C0XFARY")
- . S FARY="C0XFARY"
- D USEFARY(FARY)
- ; -- first parse the rdf file with the MXML parser
- ;S C0XDOCID=$$PARSE^C0CNHIN(ZRDF,"C0XARRAY") ; PARSE WITH MXML
- S C0XDOCID=$$EN^MXMLDOM(ZRDF,"W")
- ; -- assign the MXLM dom global name to ZDOM
- S ZDOM=$NA(^TMP("MXMLDOM",$J,C0XDOCID))
- W !,$O(@ZDOM@(""),-1)," XML NODES PARSED"
- ; -- populate the metagraph to point to the graph with status unfinished
- S METAS=$$ANONS ; GET AN ANONOMOUS RANDOM SUBJECT
- I '$D(ZMETA) S ZMETA="_:G"_$$LKY9 ; RANDOM GRAPH NAME FOR METAGRAPH
- D ADD(ZMETA,METAS,"fmts:about",ZGRF,FARY) ; POINT THE META TO THE GRAPH
- D ADD(ZMETA,METAS,"fmts:status","unfinished",FARY) ; mark as unfinished
- ;S C0XDATE=$$FMDTOUTC^C0CUTIL($$NOW^XLFDT,"DT")
- S C0XDATE=$$NOW^XLFDT
- D ADD(ZMETA,METAS,"fmts:dateTime",C0XDATE,FARY)
- D UPDIE(.C0XFDA) ; commit the metagraph changes to the triple store
- ; -- 
- ; -- pull out the vocabularies in the RDF statement. marked with xmlns:
- ; -- put them in a local variable for quick reference
- ; -- TODO: create a graph for vocabularies and validate incoming against it
- ;
- S C0XVOC=""
- N ZI,ZJ,ZK S ZI=""
- F  S ZI=$O(@ZDOM@(1,"A",ZI)) Q:ZI=""  D  ; FOR EACH xmlns
- . S ZVOC=$P(ZI,"xmlns:",2)
- . I ZVOC'="" S C0XVOC(ZVOC)=$G(@ZDOM@(1,"A",ZI))
- ;W !,"VOCABS:" ZWR C0XVOC
- ;
- ; -- look for children called rdf:Description. quit if none. not an rdf file
- ;
- S ZI=$O(@ZDOM@(1,"C",""))
- I $G(@ZDOM@(1,"C",ZI))'="rdf:Description" D  Q  ; not an rdf file
- . W !,"Error. Not an RDF file. Cannot process."
- ;
- ; -- now process the rdf description children
- ;
- S ZI=""
- S (C0XSUB,C0XPRE,C0XOBJ)="" ; INITIALIZE subject, object and predicate
- F  S ZI=$O(@ZDOM@(1,"C",ZI)) Q:ZI=""  D  ;
- . ; -- we are skipping any child that is not rdf:Description
- . ; -- TODO: check to see if this is right in general
- . ;
- . IF $G(@ZDOM@(1,"C",ZI))'="rdf:Description" D  Q  ;
- . . W !,"SKIPPING NODE: ",ZI
- . ; -- now looking for the subject for the triples
- . S ZX=$G(@ZDOM@(ZI,"A","rdf:about"))
- . I ZX'="" D  ; we have the subject
- . . ;W " about: ",ZX
- . . S C0XSUB=ZX
- . E  D  ;
- . . S ZX=$G(@ZDOM@(ZI,"A","rdf:nodeID")) ; node id is another style of subject
- . . I ZX'="" D  ;
- . . . S C0XSUB=ZX
- . I C0XSUB="" S C0XSUB=$$ANONS ; DEFAULT TO BLANK SUBJECT
- . ; 
- . ; -- we now have the subject. the children of this node have the rest
- . ;
- . S ZJ="" ; for the children of the rdf:Description nodes
- . F  S ZJ=$O(@ZDOM@(ZI,"C",ZJ)) Q:ZJ=""  D  ; for each child
- . . S C0XPRE=@ZDOM@(ZJ) ; the predicate without a prefix
- . . S ZX=$G(@ZDOM@(ZJ,"A","xmlns")) ; name space
- . . I ZX'="" S C0XPRE=ZX_C0XPRE ; add the namespace prefix
- . . I C0XPRE[":" D  ; expand using vocabulary
- . . . N ZB,ZA
- . . . S ZB=$P(C0XPRE,":",1)
- . . . S ZA=$P(C0XPRE,":",2)
- . . . I $G(C0XVOC(ZB))'="" D  ;
- . . . . S C0XPRE=C0XVOC(ZB)_ZA ; expanded 
- . . S ZY=$G(@ZDOM@(ZJ,"A","rdf:resource")) ; potential object
- . . I ZY'="" D  Q ; 
- . . . S C0XOBJ=ZY ; object
- . . . D ADD(ZGRF,C0XSUB,C0XPRE,C0XOBJ) ; finally. our first real triple
- . . ; -- this is an else because of the quit above
- . . S ZX=$G(@ZDOM@(ZJ,"A","rdf:nodeID")) ; fishing for nodeId object
- . . I ZX'="" D  Q  ; got one
- . . . S C0XOBJ=ZX ; we are using the incoming nodeIDs as object/subject 
- . . . ; without change... this could be foolish .. look at it again later
- . . . D ADD(ZGRF,C0XSUB,C0XPRE,C0XOBJ) ; go for it and add a node
- . . S C0XOBJ=$G(@ZDOM@(ZJ,"T",1)) ; hopefully an object is here
- . . I C0XOBJ="" D  Q  ; not a happy situation
- . . . W !,"ERROR, NO OBJECT FOUND FOR NODE: ",ZJ
- . . D ADD(ZGRF,C0XSUB,C0XPRE,C0XOBJ) ; go for it and add a node
- W !,"INSERTING ",C0XCNT," TRIPLES"
- D UPDIE(.C0XFDA) ; commit the updates to the file
- ; next, mark the graph as finished
- S C0XEND=$$NOW^XLFDT
- W !," ENDED AT: ",C0XEND
- S C0XDIFF=$$FMDIFF^XLFDT(C0XEND,C0XSTART,2)
- W !," ELAPSED TIME: ",C0XDIFF," SECONDS"
- W !," APPROXIMATELY ",$P(C0XCNT/C0XDIFF,".")," TRIPLES PER SECOND"
- Q
- ;
-PROCESS2(ZRTN,ZRDF,ZGRF,ZMETA,FARY) ; PROCESS AN INCOMING RDF FILE
- ; ZRTN IS PASS BY REFERENCE AND RETURNS MESSAGES ABOUT THE PROCESSING
- ; ZRDF IS PASSED BY NAME AND IS THE GLOBAL CONTAINING THE RDF FILE
- ; ZGRF IS THE NAME OF THE GRAPH TO USE IN THE TRIPLE STORE FOR RESULTS
- ; ZMETA IS OPTIONAL AND IS THE NAME OF THE GRAPH TO STORE METADATA
- ;
- I '$D(FARY) D  ;
- . D INITFARY("C0XFARY")
- . S FARY="C0XFARY"
- D USEFARY(FARY)
- ;N BATCNT
- ;N BATMAX
- S BATCNT=0 ; BATCH COUNTER
- S BATMAX=10000 ; TRY BATCHES OF THIS SIZE
- ; -- first parse the rdf file with the MXML parser
- ;S C0XDOCID=$$PARSE^C0CNHIN(ZRDF,"C0XARRAY") ; PARSE WITH MXML
- S C0XDOCID=$$EN^MXMLDOM(ZRDF,"W")
- ; -- assign the MXLM dom global name to ZDOM
- S ZDOM=$NA(^TMP("MXMLDOM",$J,C0XDOCID))
- W !,$O(@ZDOM@(""),-1)," XML NODES PARSED"
- ; -- populate the metagraph to point to the graph with status unfinished
- S METAS=$$ANONS ; GET AN ANONOMOUS RANDOM SUBJECT
- I '$D(ZMETA) S ZMETA="_:G"_$$LKY9 ; RANDOM GRAPH NAME FOR METAGRAPH
- D ADD(ZMETA,METAS,"fmts:about",ZGRF,FARY) ; POINT THE META TO THE GRAPH
- D ADD(ZMETA,METAS,"fmts:status","unfinished",FARY) ; mark as unfinished
- ;S C0XDATE=$$FMDTOUTC^C0CUTIL($$NOW^XLFDT,"DT")
- S C0XDATE=$$NOW^XLFDT
- D ADD(ZMETA,METAS,"fmts:dateTime",C0XDATE,FARY)
- D UPDIE(.C0XFDA) ; commit the metagraph changes to the triple store
- ; -- 
- ; -- pull out the vocabularies in the RDF statement. marked with xmlns:
- ; -- put them in a local variable for quick reference
- ; -- TODO: create a graph for vocabularies and validate incoming against it
- ;
- S C0XVOC=""
- N ZI,ZJ,ZK S ZI=""
- F  S ZI=$O(@ZDOM@(1,"A",ZI)) Q:ZI=""  D  ; FOR EACH xmlns
- . S ZVOC=$P(ZI,"xmlns:",2)
- . I ZVOC'="" S C0XVOC(ZVOC)=$G(@ZDOM@(1,"A",ZI))
- ;W !,"VOCABS:" ZWR C0XVOC
- ;
- ; -- look for children called rdf:Description. quit if none. not an rdf file
- ;
- S ZI=$O(@ZDOM@(1,"C",""))
- I $G(@ZDOM@(1,"C",ZI))'="rdf:Description" D  Q  ; not an rdf file
- . W !,"Error. Not an RDF file. Cannot process."
- ;
- ; -- now process the rdf description children
- ;
- S ZI=""
- S (C0XSUB,C0XPRE,C0XOBJ)="" ; INITIALIZE subject, object and predicate
- F  S ZI=$O(@ZDOM@(1,"C",ZI)) Q:ZI=""  D  ;
- . ; -- we are skipping any child that is not rdf:Description
- . ; -- TODO: check to see if this is right in general
- . ;
- . IF $G(@ZDOM@(1,"C",ZI))'="rdf:Description" D  Q  ;
- . . W !,"SKIPPING NODE: ",ZI
- . ; -- now looking for the subject for the triples
- . S ZX=$G(@ZDOM@(ZI,"A","rdf:about"))
- . I ZX'="" D  ; we have the subject
- . . ;W " about: ",ZX
- . . S C0XSUB=ZX
- . E  D  ;
- . . S ZX=$G(@ZDOM@(ZI,"A","rdf:nodeID")) ; node id is another style of subject
- . . I ZX'="" D  ;
- . . . S C0XSUB=ZX
- . I C0XSUB="" S C0XSUB=$$ANONS ; DEFAULT TO BLANK SUBJECT
- . ; 
- . ; -- we now have the subject. the children of this node have the rest
- . ;
- . S ZJ="" ; for the children of the rdf:Description nodes
- . F  S ZJ=$O(@ZDOM@(ZI,"C",ZJ)) Q:ZJ=""  D  ; for each child
- . . S C0XPRE=@ZDOM@(ZJ) ; the predicate without a prefix
- . . S ZX=$G(@ZDOM@(ZJ,"A","xmlns")) ; name space
- . . I ZX'="" S C0XPRE=ZX_C0XPRE ; add the namespace prefix
- . . I C0XPRE[":" D  ; expand using vocabulary
- . . . N ZB,ZA
- . . . S ZB=$P(C0XPRE,":",1)
- . . . S ZA=$P(C0XPRE,":",2)
- . . . I $G(C0XVOC(ZB))'="" D  ;
- . . . . S C0XPRE=C0XVOC(ZB)_ZA ; expanded 
- . . S ZY=$G(@ZDOM@(ZJ,"A","rdf:resource")) ; potential object
- . . I ZY'="" D  Q ; 
- . . . S C0XOBJ=ZY ; object
- . . . D ADD2(ZGRF,C0XSUB,C0XPRE,C0XOBJ) ; finally. our first real triple
- . . ; -- this is an else because of the quit above
- . . S ZX=$G(@ZDOM@(ZJ,"A","rdf:nodeID")) ; fishing for nodeId object
- . . I ZX'="" D  Q  ; got one
- . . . S C0XOBJ=ZX ; we are using the incoming nodeIDs as object/subject 
- . . . ; without change... this could be foolish .. look at it again later
- . . . D ADD2(ZGRF,C0XSUB,C0XPRE,C0XOBJ) ; go for it and add a node
- . . S C0XOBJ=$G(@ZDOM@(ZJ,"T",1)) ; hopefully an object is here
- . . I C0XOBJ="" D  Q  ; not a happy situation
- . . . W !,"ERROR, NO OBJECT FOUND FOR NODE: ",ZJ
- . . D ADD2(ZGRF,C0XSUB,C0XPRE,C0XOBJ) ; go for it and add a node
- W !,"INSERTING ",C0XCNT," TRIPLES"
- I $D(C0XFDA) D UPDIE(.C0XFDA) ; commit the updates to the file
- ; next, mark the graph as finished
- S C0XEND=$$NOW^XLFDT
- W !," ENDED AT: ",C0XEND
- S C0XDIFF=$$FMDIFF^XLFDT(C0XEND,C0XSTART,2)
- W !," ELAPSED TIME: ",C0XDIFF," SECONDS"
- W !," APPROXIMATELY ",$P(C0XCNT/C0XDIFF,".")," TRIPLES PER SECOND"
- Q
- ;
-SHOW(ZN) ;
- ZWR ^TMP("MXMLDOM",$J,1,ZN,*)
- Q
- ;
-ANONS() ; RETURNS AN ANONOMOUS SUBJECT
- Q "_S:"_$$LKY9
- ;
-NEWG(NGRAPH,NMETA) ; CREATES A NEW META GRAPH, MARKS IT AS UNFINISHED
- ; THEN CREATES A NEW GRAPH AND POINTS THE METAGRAPH TO IT
- ; NGRAPH AND NMETA ARE PASSED BY REFERENCE AND ARE THE RETURN
- S NGRAPH="G"_$$LKY9
- S NMETA=NGRAPH_"A"
- Q
- ;
-ADD(ZG,ZS,ZP,ZO,FARY) ; ADD A TRIPLE TO THE TRIPLESTORE. ALL VALUES ARE TEXT
- ; THE FDA IS SET UP BUT THE FILES ARE NOT UPDATED. CALL UPDIE TO COMPLETE
- I '$D(FARY) D  ;
- . D INITFARY("C0XFARY")
- . S FARY="C0XFARY"
- D USEFARY(FARY)
- I '$D(C0XCNT) S C0XCNT=0
- N ZNODE
- S ZNODE="N"_$$LKY17
- N ZNARY ; GET READY TO CALL IENOFA
- S ZNARY("ZG",ZG)=""
- S ZNARY("ZS",ZS)=""
- S ZNARY("ZP",ZP)=""
- S ZNARY("ZO",ZO)=""
- D IENOFA(.ZIENS,.ZNARY,FARY) ; RESOLVE/ADD STRINGS
- ;S ZGIEN=$$IENOF(ZG) ; LAYGO TO GET IEN
- ;S ZSIEN=$$IENOF(ZS)
- ;S ZPIEN=$$IENOF(ZP)
- ;S ZOIEN=$$IENOF(ZO)
- ;I $D(C0XFDA) D UPDIE ; ADD THE STRINGS IF NEEDED
- S C0XCNT=C0XCNT+1
- S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.01)=ZNODE
- S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.02)=$O(ZIENS("IEN","ZG",""))
- S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.03)=$O(ZIENS("IEN","ZS",""))
- S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.04)=$O(ZIENS("IEN","ZP",""))
- S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.05)=$O(ZIENS("IEN","ZO",""))
- ; REMEMBER TO CALL UPDIE WHEN YOU'RE DONE
- Q
- ;
-ADD2(ZG,ZS,ZP,ZO,FARY) ; ADD A TRIPLE TO THE TRIPLESTORE. ALL VALUES ARE TEXT
- ; THE FDA IS SET UP BUT THE FILES ARE NOT UPDATED. CALL UPDIE TO COMPLETE
- I '$D(FARY) D  ;
- . D INITFARY("C0XFARY")
- . S FARY="C0XFARY"
- D USEFARY(FARY)
- I '$D(C0XCNT) S C0XCNT=0
- N ZNODE
- S ZNODE="N"_$$LKY17
- N ZNARY ; GET READY TO CALL IENOFA
- S ZNARY("ZG",ZG)=""
- S ZNARY("ZS",ZS)=""
- S ZNARY("ZP",ZP)=""
- S ZNARY("ZO",ZO)=""
- D IENOFA(.ZIENS,.ZNARY,FARY) ; RESOLVE/ADD STRINGS
- ;S ZGIEN=$$IENOF(ZG) ; LAYGO TO GET IEN
- ;S ZSIEN=$$IENOF(ZS)
- ;S ZPIEN=$$IENOF(ZP)
- ;S ZOIEN=$$IENOF(ZO)
- ;I $D(C0XFDA) D UPDIE ; ADD THE STRINGS IF NEEDED
- S C0XCNT=C0XCNT+1
- S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.01)=ZNODE
- S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.02)=$O(ZIENS("IEN","ZG",""))
- S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.03)=$O(ZIENS("IEN","ZS",""))
- S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.04)=$O(ZIENS("IEN","ZP",""))
- S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.05)=$O(ZIENS("IEN","ZO",""))
- S BATCNT=BATCNT+1
- I BATCNT=BATMAX D  ; BATCH IS DONE
- . D UPDIE(.C0XFDA)
- . K C0XFDA
- . S BATCNT=0 ; RESET COUNTER
- ; REMEMBER TO CALL UPDIE WHEN YOU'RE DONE
- Q
- ;
-LKY9() ;EXTRINIC THAT RETURNS A RANDOM 9 DIGIT NUMBER. USED FOR GENERATING
- ; UNIQUE NODE AND GRAPH NAMES
- N ZN,ZI
- S ZN=""
- F ZI=1:1:9 D  ;
- . S ZN=ZN_$R(10)
- Q ZN
- ;
-LKY17() ;EXTRINIC THAT RETURNS A RANDOM 9 DIGIT NUMBER. USED FOR GENERATING
- ; UNIQUE NODE AND GRAPH NAMES
- N ZN,ZI
- S ZN=""
- F ZI=1:1:17 D  ;
- . S ZN=ZN_$R(10)
- Q ZN
- ;
-IENOF(ZSTRING,FARY) ; EXTRINSIC WHICH RETURNS THE IEN OF ZS IN THE STRINGS FILE
- I '$D(FARY) D  ;
- . D INITFARY("C0XFARY")
- . S FARY="C0XFARY"
- N ZIEN
- S ZIEN=$O(@C0XSN@("B",ZSTRING,""))
- I ZIEN="" D  ;
- . S C0XFDA2(C0XSFN,"+1,",.01)=ZSTRING
- . D UPDIE(.C0XFDA2)
- . S ZIEN=$O(@C0XSN@("B",ZSTRING,""))
- . K C0XFDA2
- Q ZIEN
- ;
-IENOFA(ZOUTARY,ZINARY,FARY) ; RESOLVE STRINGS TO IEN IN STRINGS FILE 
- ; OR ADD THEM IF
- ; MISSING. ZINARY AND ZOUTARY ARE PASSED BY REFERENCE 
- ; ZINARY LOOKS LIKE ZINARY("VAR","VAL")=""
- ; RETURNS IN ZOUTARY OF THE FORM ZOUTARY("IEN","VAR",IEN)=""
- I '$D(FARY) D  ;
- . D INITFARY("C0XFARY")
- . S FARY="C0XFARY"
- K ZOUTARY ; START WITH CLEAN RESULTS
- K C0XFDA2 ; USE A SEPARATE FDA FOR THIS
- N ZI S ZI=""
- N ZV,ZIEN
- N ZCNT S ZCNT=0
- F  S ZI=$O(ZINARY(ZI)) Q:ZI=""  D  ; LOOK FOR MISSING STRINGS
- . S ZV=$O(ZINARY(ZI,""))
- . I $O(@C0XSN@("B",ZV,""))="" D  ;
- . . S ZCNT=ZCNT+1
- . . S C0XFDA2(C0XSFN,"+"_ZCNT_",",.01)=ZV
- I $D(C0XFDA2) D  ;
- . D UPDIE(.C0XFDA2) ; ADD MISSING STRINGS
- . K C0XFDA2 ; CLEAN UP
- F  S ZI=$O(ZINARY(ZI)) Q:ZI=""  D  ; NOT GET ALL IENS
- . S ZV=$O(ZINARY(ZI,""))
- . S ZIEN=$O(@C0XSN@("B",ZV,"")) ; THEY SHOULD BE THERE NOW
- . I ZIEN="" D  ;
- . . W !,"ERROR ADDING STRING: ",ZV
- . . B
- . S ZOUTARY("IEN",ZI,ZIEN)=""
- Q
- ;
-UPDIE(ZFDA) ; INTERNAL ROUTINE TO CALL UPDATE^DIE AND CHECK FOR ERRORS
- ; ZFDA IS PASSED BY REFERENCE
- ;ZWR ZFDA
- ;B
- K ZERR
- D CLEAN^DILF
- D UPDATE^DIE("","ZFDA","","ZERR")
- I $D(ZERR) S ZZERR=ZZERR ; ZZERR DOESN'T EXIST, 
- ; INVOKE THE ERROR TRAP IF TASKED
- ;. W "ERROR",!
- ;. ZWR ZERR
- ;. B
- K ZFDA
- Q
- ;
+C0XMAIN	; GPL - Fileman Triples entry point routine ;10/13/11  17:05
+	;;0.1;C0X;nopatch;noreleasedate;Build 5
+	;Copyright 2011 George Lilly.  Licensed under the terms of the GNU
+	;General Public License See attached copy of the License.
+	;
+	;This program is free software; you can redistribute it and/or modify
+	;it under the terms of the GNU General Public License as published by
+	;the Free Software Foundation; either version 2 of the License, or
+	;(at your option) any later version.
+	;
+	;This program is distributed in the hope that it will be useful,
+	;but WITHOUT ANY WARRANTY; without even the implied warranty of
+	;MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+	;GNU General Public License for more details.
+	;
+	;You should have received a copy of the GNU General Public License along
+	;with this program; if not, write to the Free Software Foundation, Inc.,
+	;51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
+	;
+	Q
+	;
+INITFARY(ZFARY)	; FILL ARRAY ZFARY WITH THE DEFAULT TRIPLE STORE SETTINGS
+	; ZFARY IS PASSED BY NAME. EACH SUBSCRIPT SET BELOW IS THE NAME OF A VARIABLE
+	; THAT USEFARY CREATES. USE OTHER VALUES FOR SUPPORTING ADDITIONAL TRIPLE STORES
+	S @ZFARY@("C0XTFN")=172.101 ; TRIPLES FILE NUMBER
+	S @ZFARY@("C0XSFN")=172.201 ; TRIPLES STRINGS FILE NUMBER
+	S @ZFARY@("C0XTN")=$NA(^C0X(101)) ; TRIPLES GLOBAL NAME
+	S @ZFARY@("C0XSN")=$NA(^C0X(201)) ; STRING FILE GLOBAL NAME
+	;S @ZFARY@("C0XDIR")="/home/glilly/all_smart_patient_data/smart-rdf/"
+	S @ZFARY@("C0XDIR")="/home/george/fmts/trunk/samples/" ; DIRECTORY IMPORT READS FROM BY DEFAULT
+	D USEFARY(ZFARY) ; COPY THE SETTINGS INTO VARIABLES OF THE SAME NAMES
+	Q
+	;
+USEFARY(ZFARY)	; SET ONE VARIABLE PER TOP-LEVEL SUBSCRIPT OF ARRAY ZFARY
+	N ZI S ZI=""
+	F  S ZI=$O(@ZFARY@(ZI)) Q:ZI=""  D  
+	. ; ZFARY IS PASSED BY NAME; EACH SUBSCRIPT IS A VARIABLE NAME, ITS NODE THE VALUE
+	. ; THE VARIABLE IS SET BY NAME INDIRECTION INSTEAD OF XECUTING A BUILT STRING,
+	. ; SO A VALUE CONTAINING A QUOTE CANNOT BREAK THE SET AND NO ZX IS LEFT BEHIND
+	. S @ZI=@ZFARY@(ZI)
+	Q
+	;
+IMPORT(FNAME,FDIR,FURL,FARY)	; READS A HOST FILE AND INSERTS IT INTO THE TRIPLESTORE
+	; THE FILE IS READ WITH FILEIN AND HANDED TO INSRDF. THIS TAG ENDS WITH AN
+	; ARGUMENTLESS QUIT AND RETURNS NO VALUE, SO INVOKE IT WITH DO, NOT WITH $$
+	; FDIR IS THE OPTIONAL DIRECTORY (DEFAULTS TO C0XDIR FROM THE FILE ARRAY)
+	; FURL IS THE OPTIONAL NAME GIVEN TO INSRDF (DEFAULTS TO FDIR_FNAME WITH "." AS "_")
+	; FARY IS THE OPTIONAL FILE ARRAY OF THE TRIPLE STORE TO USE
+	I '$D(FARY) D  ;
+	. D INITFARY("C0XFARY")
+	. S FARY="C0XFARY"
+	D USEFARY(FARY)
+	N ZD,ZTMP
+	I '$D(FDIR) S FDIR=C0XDIR ; DIRECTORY OF THE RDF FILE
+	I '$D(FURL) D  ;
+	. N ZN2 S ZN2=$TR(FNAME,".","_") ; REPLACE EACH DOT IN THE NAME WITH "_"
+	. S FURL=FDIR_ZN2
+	N ZTMP ; ZTMP WAS ALREADY NEWED ABOVE
+	S ZTMP=$NA(^TMP("C0X",$J,"FILEIN",1)) ; WHERE TO PUT THE INCOMING FILE
+	K @ZTMP ; MAKE SURE IT'S CLEAR
+	S C0XSTART=$$NOW^XLFDT ; NOT NEWED - PROCESS READS IT TO COMPUTE ELAPSED TIME
+	W !,"STARTED: ",C0XSTART
+	W !,"READING IN: ",FNAME
+	I '$$FILEIN(ZTMP,FDIR,FNAME,4) D  Q  ; QUIT IF NO SUCCESS
+	. W !,"ERROR READING FILE: ",FDIR,FNAME 
+	S ZRDF=$NA(^TMP("C0X",$J,"FILEIN")) ; WITHOUT THE SUBSCRIPT
+	W !,$O(@ZRDF@(""),-1)," LINES READ"
+	D INSRDF(ZRDF,FURL,FARY) ; IMPORT AND PROCESS THE RDF
+	Q
+	;
+WGET(ZURL,FARY)	; GET FROM THE INTERNET AN RDF FILE AND INSERT IT
+	; ZURL IS THE ADDRESS TO FETCH; IT IS ALSO PASSED TO INSRDF AS THE NAME
+	I '$D(FARY) D  ;
+	. D INITFARY("C0XFARY")
+	. S FARY="C0XFARY"
+	D USEFARY(FARY)
+	;N ZLOC,ZTMP
+	K ZTMP
+	S ZLOC=$NA(^TMP("C0X","WGET",$J)) K @ZLOC ; CLEAR LINES LEFT BY AN EARLIER DOWNLOAD
+	S C0XSTART=$$NOW^XLFDT ; NOT NEWED - PROCESS READS IT TO COMPUTE ELAPSED TIME
+	W !,"STARTED: ",C0XSTART
+	W !,"DOWNLOADING: ",ZURL
+	S OK=$$httpGET^%zewdGTM(ZURL,.ZTMP) ; NOTE(review): OK IS NOT CHECKED - CONFIRM ITS MEANING
+	M @ZLOC=ZTMP
+	W !,$O(@ZLOC@(""),-1)," LINES READ"
+	D INSRDF(ZLOC,ZURL,FARY)
+	Q
+	;
+INSRDF(ZRDF,ZNAME,FARY)	; INSERT AN RDF FILE INTO THE STORE AND PROCESS
+	; ZRDF IS PASSED BY NAME. ZNAME IS FILED AS fmts:url AND IS ALSO THE GRAPH NAME GIVEN TO PROCESS
+	I '$D(FARY) D  ;
+	. D INITFARY("C0XFARY")
+	. S FARY="C0XFARY"
+	D USEFARY(FARY)
+	N ZGRAPH,ZSUBJECT
+	S ZGRAPH="_:G"_$$LKY9 ; RANDOM GRAPH NAME
+	S ZSUBJECT=$$ANONS ; RANDOM ANONYMOUS SUBJECT
+	D ADD(ZGRAPH,ZSUBJECT,"fmts:url",ZNAME,FARY)
+	N ZTXTNM
+	S ZTXTNM="_TXT_INCOMING_RDF_FILE_"_ZNAME_"_"_$$LKY9 ; NAME FOR TEXT NODE
+	D ADD(ZGRAPH,ZSUBJECT,"fmts:rdfSource",ZTXTNM,FARY)
+	D UPDIE(.C0XFDA) ; FILE THE TWO TRIPLES QUEUED ABOVE
+	K C0XCNT ; RESET THE TRIPLE COUNTER SO ADD STARTS AGAIN FROM ZERO
+	D STORETXT(ZRDF,ZTXTNM,FARY)
+	W !,"ADDED: ",ZGRAPH," ",ZSUBJECT," fmts:rdfSource ",ZTXTNM
+	D PROCESS(.G,ZRDF,ZNAME,ZGRAPH,FARY) ; PARSE AND INSERT THE RDF; ZGRAPH IS PASSED AS THE METAGRAPH
+	Q
+	;
+STORETXT(ZTXT,ZNAME,FARY)	; STORE TEXT IN THE TRIPLESTORE AT ZNAME
+	; ZTXT IS HANDED TO WP^DIE AS THE TEXT SOURCE; ZNAME IS THE STRING ENTRY TO FILE IT UNDER
+	I '$D(FARY) D  ;
+	. D INITFARY("C0XFARY")
+	. S FARY="C0XFARY"
+	D USEFARY(FARY)
+	N ZIEN
+	S ZIEN=$$IENOF(ZNAME,FARY) ; GET THE IEN (IENOF ADDS THE STRING IF IT IS MISSING)
+	D CLEAN^DILF
+	K ZERR
+	D WP^DIE(C0XSFN,ZIEN_",",1,,ZTXT,"ZERR") ; FILE INTO FIELD 1 OF THE STRINGS FILE
+	I $D(ZERR) D  ;
+	. ZWR ZERR
+	Q
+	; 
+GETTXT(ZRTN,ZNAME,FARY)	; RETURNS RDF SOURCE OR OTHER TEXT
+	; ZRTN IS PASSED BY REFERENCE. ZNAME IS THE STRING ENTRY WHOSE FIELD 1 TEXT IS FETCHED
+	I '$D(FARY) D  ;
+	. D INITFARY("C0XFARY")
+	. S FARY="C0XFARY"
+	D USEFARY(FARY)
+	N ZIEN
+	S ZIEN=$$IENOF(ZNAME,FARY) ; PASS FARY SO IENOF DOES NOT RESET THE SETTINGS TO THE DEFAULT STORE
+	S OK=$$GET1^DIQ(C0XSFN,ZIEN_",",1,,"ZRTN")
+	Q
+	;
+WHERETXT(ZNAME,FARY)	; EXTRINSIC WHICH RETURNS THE NAME OF THE GLOBAL
+	; WHERE THE TEXT IS LOCATED. ZNAME IS THE NAME OF THE STRING
+	I '$D(FARY) D  ;
+	. D INITFARY("C0XFARY")
+	. S FARY="C0XFARY"
+	D USEFARY(FARY)
+	N ZIEN
+	S ZIEN=$$IENOF(ZNAME,FARY) ; PASS FARY SO IENOF DOES NOT RESET C0XSN TO THE DEFAULT STORE
+	Q $NA(@C0XSN@(ZIEN,1))
+	;
+FILEIN(ZINTMP,ZDIR,ZFNAME,ZLVL)	; READS FILE ZFNAME IN DIRECTORY ZDIR INTO ZINTMP USING FTG^%ZISH
+	; ZINTMP IS PASSED BY NAME AND INCLUDES THE NEW SUBSCRIPT
+	; IE ^TMP("C0X","FILEIN",1)
+	; ZLVL IN THIS CASE WOULD BE 3 INCREMENTING THE 1
+	; EXTRINSIC WHICH RETURNS THE RESULT OF FTG^%ZISH
+	S OK=$$FTG^%ZISH(ZDIR,ZFNAME,ZINTMP,ZLVL) ; USE THE ZFNAME PARAMETER, NOT THE CALLER'S FNAME
+	Q OK
+	;
+TESTPROC	; TEST PROCESS WITH EXISTING SMALL RDF FILE
+	S ZIN=$NA(^TMP("C0X",12226,"FILEIN")) ; HARD-CODED JOB NUMBER - THE FILE MUST ALREADY BE LOADED THERE
+	S ZGRAPH="/test/rdfFile"
+	S ZM="/test/rdfFile/meta"
+	D PROCESS(.G,ZIN,ZGRAPH,ZM) ; NO FARY, SO PROCESS USES THE DEFAULT FILE ARRAY
+	Q
+	;
+PROCESS(ZRTN,ZRDF,ZGRF,ZMETA,FARY)	; PROCESS AN INCOMING RDF FILE
+	; ZRTN IS PASSED BY REFERENCE FOR MESSAGES; THIS VERSION NEVER SETS IT
+	; ZRDF IS PASSED BY NAME AND IS THE GLOBAL CONTAINING THE RDF FILE
+	; ZGRF IS THE NAME OF THE GRAPH TO USE IN THE TRIPLE STORE FOR RESULTS
+	; ZMETA IS OPTIONAL AND IS THE NAME OF THE GRAPH TO STORE METADATA
+	; FARY IS THE OPTIONAL FILE ARRAY NAME AND IS PASSED ON TO EVERY ADD CALL
+	I '$D(FARY) D  ;
+	. D INITFARY("C0XFARY")
+	. S FARY="C0XFARY"
+	D USEFARY(FARY)
+	; -- first parse the rdf file with the MXML parser
+	;S C0XDOCID=$$PARSE^C0CNHIN(ZRDF,"C0XARRAY") ; PARSE WITH MXML
+	S C0XDOCID=$$EN^MXMLDOM(ZRDF,"W")
+	; -- assign the MXML dom global name to ZDOM
+	S ZDOM=$NA(^TMP("MXMLDOM",$J,C0XDOCID))
+	W !,$O(@ZDOM@(""),-1)," XML NODES PARSED"
+	; -- populate the metagraph to point to the graph with status unfinished
+	S METAS=$$ANONS ; GET AN ANONYMOUS RANDOM SUBJECT
+	I '$D(ZMETA) S ZMETA="_:G"_$$LKY9 ; RANDOM GRAPH NAME FOR METAGRAPH
+	D ADD(ZMETA,METAS,"fmts:about",ZGRF,FARY) ; POINT THE META TO THE GRAPH
+	D ADD(ZMETA,METAS,"fmts:status","unfinished",FARY) ; mark as unfinished
+	;S C0XDATE=$$FMDTOUTC^C0CUTIL($$NOW^XLFDT,"DT")
+	S C0XDATE=$$NOW^XLFDT
+	D ADD(ZMETA,METAS,"fmts:dateTime",C0XDATE,FARY)
+	D UPDIE(.C0XFDA) ; commit the metagraph changes to the triple store
+	; -- 
+	; -- pull out the vocabularies in the RDF statement. marked with xmlns:
+	; -- put them in a local variable for quick reference
+	; -- TODO: create a graph for vocabularies and validate incoming against it
+	;
+	S C0XVOC=""
+	N ZI,ZJ,ZK S ZI=""
+	F  S ZI=$O(@ZDOM@(1,"A",ZI)) Q:ZI=""  D  ; FOR EACH xmlns
+	. S ZVOC=$P(ZI,"xmlns:",2)
+	. I ZVOC'="" S C0XVOC(ZVOC)=$G(@ZDOM@(1,"A",ZI))
+	;W !,"VOCABS:" ZWR C0XVOC
+	;
+	; -- look for children called rdf:Description. quit if none. not an rdf file
+	;
+	S ZI=$O(@ZDOM@(1,"C",""))
+	I $G(@ZDOM@(1,"C",ZI))'="rdf:Description" D  Q  ; not an rdf file
+	. W !,"Error. Not an RDF file. Cannot process."
+	;
+	; -- now process the rdf description children
+	;
+	S ZI=""
+	S (C0XSUB,C0XPRE,C0XOBJ)="" ; INITIALIZE subject, object and predicate
+	F  S ZI=$O(@ZDOM@(1,"C",ZI)) Q:ZI=""  D  ;
+	. ; -- we are skipping any child that is not rdf:Description
+	. ; -- TODO: check to see if this is right in general
+	. ;
+	. IF $G(@ZDOM@(1,"C",ZI))'="rdf:Description" D  Q  ;
+	. . W !,"SKIPPING NODE: ",ZI
+	. S C0XSUB="" ; -- forget the previous node's subject, then look for this node's
+	. S ZX=$G(@ZDOM@(ZI,"A","rdf:about"))
+	. I ZX'="" D  ; we have the subject
+	. . ;W " about: ",ZX
+	. . S C0XSUB=ZX
+	. E  D  ;
+	. . S ZX=$G(@ZDOM@(ZI,"A","rdf:nodeID")) ; node id is another style of subject
+	. . I ZX'="" D  ;
+	. . . S C0XSUB=ZX
+	. I C0XSUB="" S C0XSUB=$$ANONS ; DEFAULT TO BLANK SUBJECT
+	. ; 
+	. ; -- we now have the subject. the children of this node have the rest
+	. ;
+	. S ZJ="" ; for the children of the rdf:Description nodes
+	. F  S ZJ=$O(@ZDOM@(ZI,"C",ZJ)) Q:ZJ=""  D  ; for each child
+	. . S C0XPRE=@ZDOM@(ZJ) ; the predicate without a prefix
+	. . S ZX=$G(@ZDOM@(ZJ,"A","xmlns")) ; name space
+	. . I ZX'="" S C0XPRE=ZX_C0XPRE ; add the namespace prefix
+	. . I C0XPRE[":" D  ; expand using vocabulary
+	. . . N ZB,ZA
+	. . . S ZB=$P(C0XPRE,":",1)
+	. . . S ZA=$P(C0XPRE,":",2)
+	. . . I $G(C0XVOC(ZB))'="" D  ;
+	. . . . S C0XPRE=C0XVOC(ZB)_ZA ; expanded 
+	. . S ZY=$G(@ZDOM@(ZJ,"A","rdf:resource")) ; potential object
+	. . I ZY'="" D  Q ; 
+	. . . S C0XOBJ=ZY ; object
+	. . . D ADD(ZGRF,C0XSUB,C0XPRE,C0XOBJ,FARY) ; finally. our first real triple
+	. . ; -- this is an else because of the quit above
+	. . S ZX=$G(@ZDOM@(ZJ,"A","rdf:nodeID")) ; fishing for nodeId object
+	. . I ZX'="" D  Q  ; got one
+	. . . S C0XOBJ=ZX ; we are using the incoming nodeIDs as object/subject 
+	. . . ; without change... this could be foolish .. look at it again later
+	. . . D ADD(ZGRF,C0XSUB,C0XPRE,C0XOBJ,FARY) ; go for it and add a node
+	. . S C0XOBJ=$G(@ZDOM@(ZJ,"T",1)) ; hopefully an object is here
+	. . I C0XOBJ="" D  Q  ; not a happy situation
+	. . . W !,"ERROR, NO OBJECT FOUND FOR NODE: ",ZJ
+	. . D ADD(ZGRF,C0XSUB,C0XPRE,C0XOBJ,FARY) ; go for it and add a node
+	W !,"INSERTING ",C0XCNT," TRIPLES"
+	D UPDIE(.C0XFDA) ; commit the updates to the file
+	; next, mark the graph as finished
+	S C0XEND=$$NOW^XLFDT
+	W !," ENDED AT: ",C0XEND
+	S C0XDIFF=$$FMDIFF^XLFDT(C0XEND,C0XSTART,2) ; C0XSTART MUST HAVE BEEN SET BY THE CALLER (IMPORT OR WGET)
+	W !," ELAPSED TIME: ",C0XDIFF," SECONDS"
+	I C0XDIFF>0 W !," APPROXIMATELY ",$P(C0XCNT/C0XDIFF,".")," TRIPLES PER SECOND"
+	Q
+	;
+SHOW(ZN)	; DEBUG AID: DUMP NODE ZN OF THE PARSED DOM (DOCUMENT HANDLE 1 IS HARD-CODED)
+	ZWR ^TMP("MXMLDOM",$J,1,ZN,*)
+	Q
+	;
+ANONS()	; RETURNS AN ANONYMOUS SUBJECT NAME: "_S:" FOLLOWED BY 9 RANDOM DIGITS
+	Q "_S:"_$$LKY9
+	;
+NEWG(NGRAPH,NMETA)	; GENERATES A RANDOM GRAPH NAME AND A MATCHING METAGRAPH NAME
+	; ONLY THE TWO NAMES ARE BUILT HERE; NOTHING IS ADDED TO THE TRIPLE STORE
+	; NGRAPH AND NMETA ARE PASSED BY REFERENCE AND ARE THE RETURN
+	S NGRAPH="G"_$$LKY9
+	S NMETA=NGRAPH_"A"
+	Q
+	;
+ADD(ZG,ZS,ZP,ZO,FARY)	; ADD A TRIPLE TO THE TRIPLESTORE. ALL VALUES ARE TEXT
+	; ZG,ZS,ZP,ZO ARE GRAPH, SUBJECT, PREDICATE, OBJECT. THE TRIPLE IS ONLY QUEUED IN C0XFDA; CALL UPDIE TO FILE IT
+	I '$D(FARY) D  ;
+	. D INITFARY("C0XFARY")
+	. S FARY="C0XFARY"
+	D USEFARY(FARY)
+	I '$D(C0XCNT) S C0XCNT=0
+	N ZNODE
+	S ZNODE="N"_$$LKY17
+	N ZNARY ; GET READY TO CALL IENOFA
+	S ZNARY("ZG",ZG)=""
+	S ZNARY("ZS",ZS)=""
+	S ZNARY("ZP",ZP)=""
+	S ZNARY("ZO",ZO)=""
+	D IENOFA(.ZIENS,.ZNARY,FARY) ; RESOLVE/ADD STRINGS (ZIENS IS NOT NEWED HERE)
+	;S ZGIEN=$$IENOF(ZG) ; LAYGO TO GET IEN
+	;S ZSIEN=$$IENOF(ZS)
+	;S ZPIEN=$$IENOF(ZP)
+	;S ZOIEN=$$IENOF(ZO)
+	;I $D(C0XFDA) D UPDIE ; ADD THE STRINGS IF NEEDED
+	S C0XCNT=C0XCNT+1 ; C0XCNT NUMBERS THE QUEUED ENTRIES AND IS NOT NEWED
+	S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.01)=ZNODE
+	S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.02)=$O(ZIENS("IEN","ZG",""))
+	S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.03)=$O(ZIENS("IEN","ZS",""))
+	S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.04)=$O(ZIENS("IEN","ZP",""))
+	S C0XFDA(C0XTFN,"?+"_C0XCNT_",",.05)=$O(ZIENS("IEN","ZO",""))
+	; REMEMBER TO CALL UPDIE WHEN YOU'RE DONE
+	Q
+	;
+LKY9()	;EXTRINSIC THAT RETURNS A STRING OF 9 RANDOM DIGITS. USED FOR GENERATING
+	; UNIQUE NODE AND GRAPH NAMES (UNIQUENESS IS NOT CHECKED HERE)
+	N ZN,ZI
+	S ZN=""
+	F ZI=1:1:9 D  ;
+	. S ZN=ZN_$R(10) ; APPEND ONE RANDOM DIGIT 0-9
+	Q ZN
+	;
+LKY17()	;EXTRINSIC THAT RETURNS A STRING OF 17 RANDOM DIGITS. USED FOR GENERATING
+	; UNIQUE NODE AND GRAPH NAMES (UNIQUENESS IS NOT CHECKED HERE)
+	N ZN,ZI
+	S ZN=""
+	F ZI=1:1:17 D  ;
+	. S ZN=ZN_$R(10) ; APPEND ONE RANDOM DIGIT 0-9
+	Q ZN
+	;
+IENOF(ZSTRING,FARY)	; EXTRINSIC WHICH RETURNS THE IEN OF ZSTRING IN THE STRINGS FILE, ADDING IT IF MISSING
+	I '$D(FARY) D  ; WHEN FARY IS PASSED, C0XSN AND C0XSFN MUST ALREADY BE SET BY THE CALLER
+	. D INITFARY("C0XFARY")
+	. S FARY="C0XFARY"
+	N ZIEN
+	S ZIEN=$O(@C0XSN@("B",ZSTRING,"")) ; LOOK THE STRING UP IN THE "B" INDEX
+	I ZIEN="" D  ;
+	. S C0XFDA2(C0XSFN,"+1,",.01)=ZSTRING
+	. D UPDIE(.C0XFDA2)
+	. S ZIEN=$O(@C0XSN@("B",ZSTRING,"")) ; LOOK IT UP AGAIN NOW THAT IT HAS BEEN FILED
+	. K C0XFDA2
+	Q ZIEN
+	;
+IENOFA(ZOUTARY,ZINARY,FARY)	; RESOLVE STRINGS TO IEN IN STRINGS FILE
+	; OR ADD THEM IF
+	; MISSING. ZINARY AND ZOUTARY ARE PASSED BY REFERENCE
+	; ZINARY LOOKS LIKE ZINARY("VAR","VAL")=""
+	; RETURNS IN ZOUTARY OF THE FORM ZOUTARY("IEN","VAR",IEN)=""
+	I '$D(FARY) D  ;
+	. D INITFARY("C0XFARY")
+	. S FARY="C0XFARY"
+	K ZOUTARY ; START WITH CLEAN RESULTS
+	K C0XFDA2 ; USE A SEPARATE FDA FOR THIS
+	N ZI S ZI=""
+	N ZV,ZIEN
+	N ZCNT S ZCNT=0
+	F  S ZI=$O(ZINARY(ZI)) Q:ZI=""  D  ; LOOK FOR MISSING STRINGS
+	. S ZV=$O(ZINARY(ZI,""))
+	. I $O(@C0XSN@("B",ZV,""))="" D  ;
+	. . S ZCNT=ZCNT+1
+	. . S C0XFDA2(C0XSFN,"+"_ZCNT_",",.01)=ZV ; NOTE(review): THE SAME MISSING VALUE UNDER TWO VARS IS QUEUED TWICE
+	I $D(C0XFDA2) D  ;
+	. D UPDIE(.C0XFDA2) ; ADD MISSING STRINGS
+	. K C0XFDA2 ; CLEAN UP
+	F  S ZI=$O(ZINARY(ZI)) Q:ZI=""  D  ; NOW GET ALL IENS (ZI IS "" AGAIN AFTER THE FIRST LOOP)
+	. S ZV=$O(ZINARY(ZI,""))
+	. S ZIEN=$O(@C0XSN@("B",ZV,"")) ; THEY SHOULD BE THERE NOW
+	. I ZIEN="" D  ;
+	. . W !,"ERROR ADDING STRING: ",ZV
+	. . B  ; DROPS INTO THE DEBUGGER; THE SET BELOW THEN RUNS WITH AN EMPTY ZIEN
+	. S ZOUTARY("IEN",ZI,ZIEN)=""
+	Q
+	;
+UPDIE(ZFDA)	; INTERNAL ROUTINE TO CALL UPDATE^DIE AND CHECK FOR ERRORS
+	; ZFDA IS PASSED BY REFERENCE AND IS KILLED BEFORE RETURNING
+	;ZWR ZFDA
+	;B
+	K ZERR
+	D CLEAN^DILF
+	D UPDATE^DIE("","ZFDA","","ZERR") ; THE FDA AND THE ERROR ARRAY ARE GIVEN BY NAME
+	I $D(ZERR) S ZZERR=ZZERR ; ZZERR DOESN'T EXIST, SO THIS RAISES AN UNDEFINED VARIABLE ERROR ON PURPOSE
+	; INVOKE THE ERROR TRAP IF TASKED
+	;. W "ERROR",!
+	;. ZWR ZERR
+	;. B
+	K ZFDA
+	Q
+	;
Index: fmts/trunk/p/C0XTEST.m
===================================================================
--- fmts/trunk/p/C0XTEST.m	(revision 1281)
+++ fmts/trunk/p/C0XTEST.m	(revision 1294)
@@ -1,125 +1,125 @@
-C0XTEST ; GPL - Fileman Triples bulk load tester ;11/6/11  17:05
- ;;0.1;C0X;nopatch;noreleasedate;Build 1
- ;Copyright 2011 George Lilly.  Licensed under the terms of the GNU
- ;General Public License See attached copy of the License.
- ;
- ;This program is free software; you can redistribute it and/or modify
- ;it under the terms of the GNU General Public License as published by
- ;the Free Software Foundation; either version 2 of the License, or
- ;(at your option) any later version.
- ;
- ;This program is distributed in the hope that it will be useful,
- ;but WITHOUT ANY WARRANTY; without even the implied warranty of
- ;MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
- ;GNU General Public License for more details.
- ;
- ;You should have received a copy of the GNU General Public License along
- ;with this program; if not, write to the Free Software Foundation, Inc.,
- ;51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
- ;
- Q
- ;
-EN ; run the test
- ;
- k C0XFDA ; clear the node variable
- i '$d(^C0X(101,0)) d  ; global doesn't exist
- . s ^C0X(101,0)="C0X TRIPLE^172.101^1^1"
- n zg
- S zg="_:G"_$$LKY9 ; all nodes are in the same graph
- n zi
- f zi=1:1:10000 d  ; try a test of 10000 nodes
- . s C0XFDA(172.101,zi,.01)="N"_$$LKY17 ; node name
- . s C0XFDA(172.101,zi,.02)=zg
- . s C0XFDA(172.101,zi,.03)=$R(100000)
- . s C0XFDA(172.101,zi,.04)=$R(100000)
- . s C0XFDA(172.101,zi,.05)=$R(100000)
- S C0XST=$$NOW^XLFDT ; start of the insertion test
- W !,"INSERTION STARTS AT ",C0XST,!
- d BULKLOAD(.C0XFDA)
- s C0XEND=$$NOW^XLFDT ; end of the insertion test
- W !,"INSERTION ENDS AT ",C0XEND
- S C0XDIFF=$$FMDIFF^XLFDT(C0XEND,C0XST,2)
- W !," ELAPSED TIME: ",C0XDIFF," SECONDS"
- W !," APPROXIMATELY ",$P(10000/C0XDIFF,".")," NODES PER SECOND"
- q
- ;
-LKY9() ;EXTRINIC THAT RETURNS A RANDOM 9 DIGIT NUMBER. USED FOR GENERATING
- ; UNIQUE NODE AND GRAPH NAMES
- N ZN,ZI
- S ZN=""
- F ZI=1:1:9 D  ;
- . S ZN=ZN_$R(10)
- Q ZN
- ;
-LKY17() ;EXTRINIC THAT RETURNS A RANDOM 9 DIGIT NUMBER. USED FOR GENERATING
- ; UNIQUE NODE AND GRAPH NAMES
- N ZN,ZI
- S ZN=""
- F ZI=1:1:17 D  ;
- . S ZN=ZN_$R(10)
- Q ZN
- ;
-BULKLOAD(ZBFDA) ; BULK LOADER FOR LOADING TRIPLES INTO FILE 172.101
- ; USING GLOBAL SETS INSTEAD OF UPDATE^DIE
- ; QUITS IF FILE IS NOT 172.101
- ; EXPECTS AN FDA WITHOUT STRINGS FOR THE IENS, STARTING AT 1
- ; QUITS IF FIRST ENTRY IS NOT IENS 1
- ; ASSUMES THAT THE LAST IENS IS THE COUNT OF ENTRIES
- ; ZBFDA IS PASSED BY REFERENCE
- ;
- ; -- reserves a block of iens from file 172.101 by locking the zero node
- ; -- ^C0X(101,0) and adding the count of entries to piece 2 and 3
- ; -- then unlocking to minimize the duration of the lock
- ;
- W !,"USING BULKLOAD"
- I '$D(ZBFDA) Q  ; EMPTY FDA
- I $O(ZBFDA(""))'=172.101 Q  ; WRONG FILE
- N ZCNT,ZP3,ZP4
- ; -- find the number of nodes to insert
- S ZCNT=$O(ZBFDA(172.101,""),-1)
- I ZCNT="" D  Q  ;
- . W !,"ERROR IN BULK LOAD - INVALID NODE COUNT"
- . B
- ; -- lock the zero node and reserve a block of iens to insert
- W !,"LOCKING ZERO NODE"
- LOCK +^C0X(101,0)
- S ZP3=$P(^C0X(101,0),U,3)
- S ZP4=$P(^C0X(101,0),U,4)
- S $P(^C0X(101,0),U,3)=ZP3+ZCNT+1
- S $P(^C0X(101,0),U,4)=ZP4+ZCNT+1
- LOCK -^C0X(101,0)
- N ZI,ZN,ZG,ZS,ZP,ZO,ZIEN,ZBASE
- S ZBASE=ZP3 ; the last ien in the file
- W !,"ZERO NODE UNLOCKED, IENS RESERVED=",ZCNT
- W !,$$NOW^XLFDT
- S ZI=""
- F  S ZI=$O(ZBFDA(172.101,ZI)) Q:ZI=""  D  ;
- . S ZN=$G(ZBFDA(172.101,ZI,.01)) ; node name
- . I ZN="" D BLKERR Q  ; 
- . S ZG=$G(ZBFDA(172.101,ZI,.02)) ; graph pointer
- . I ZG="" D BLKERR Q  ; 
- . S ZS=$G(ZBFDA(172.101,ZI,.03)) ; subject pointer
- . I ZS="" D BLKERR Q  ; 
- . S ZP=$G(ZBFDA(172.101,ZI,.04)) ; predicate pointer
- . I ZP="" D BLKERR Q  ; 
- . S ZO=$G(ZBFDA(172.101,ZI,.05)) ; object pointer
- . I ZO="" D BLKERR Q  ; 
- . S ZIEN=ZI+ZBASE ; the new ien
- . S ^C0X(101,ZIEN,0)=ZN_U_ZG_U_ZS_U_ZP_U_ZO ; set the zero node
- . S ^C0X(101,"B",ZN,ZIEN)="" ; the B index
- . S ^C0X(101,"G",ZG,ZIEN)="" ; the G for Graph index
- . S ^C0X(101,"SPO",ZS,ZP,ZO)=""
- . S ^C0X(101,"SOP",ZS,ZO,ZP)=""
- . S ^C0X(101,"OPS",ZO,ZP,ZS)=""
- . S ^C0X(101,"OSP",ZO,ZS,ZP)=""
- . S ^C0X(101,"GOPS",ZG,ZO,ZP,ZS)=""
- . S ^C0X(101,"GOSP",ZG,ZO,ZS,ZP)=""
- . S ^C0X(101,"GPSO",ZG,ZP,ZS,ZO)=""
- . S ^C0X(101,"GSPO",ZG,ZS,ZP,ZO)=""
- Q
- ;
-BLKERR ; 
- W !,"ERROR IN BULK LOAD",! ZWR ZBFDA(ZI)
- B
- Q
- ;
+C0XTEST	; GPL - Fileman Triples bulk load tester ;11/6/11  17:05
+	;;0.1;C0X;nopatch;noreleasedate;Build 5
+	;Copyright 2011 George Lilly.  Licensed under the terms of the GNU
+	;General Public License See attached copy of the License.
+	;
+	;This program is free software; you can redistribute it and/or modify
+	;it under the terms of the GNU General Public License as published by
+	;the Free Software Foundation; either version 2 of the License, or
+	;(at your option) any later version.
+	;
+	;This program is distributed in the hope that it will be useful,
+	;but WITHOUT ANY WARRANTY; without even the implied warranty of
+	;MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+	;GNU General Public License for more details.
+	;
+	;You should have received a copy of the GNU General Public License along
+	;with this program; if not, write to the Free Software Foundation, Inc.,
+	;51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
+	;
+	Q
+	;
+EN	; run the test: build an FDA of random triples and time BULKLOAD on it
+	;
+	k C0XFDA ; clear the node variable
+	i '$d(^C0X(101,0)) d  ; global doesn't exist
+	. s ^C0X(101,0)="C0X TRIPLE^172.101^1^1"
+	n zg
+	S zg="_:G"_$$LKY9 ; all nodes are in the same graph
+	n zi
+	f zi=1:1:100000 d  ; try a test of 100000 nodes
+	. s C0XFDA(172.101,zi,.01)="N"_$$LKY17 ; node name
+	. s C0XFDA(172.101,zi,.02)=zg
+	. s C0XFDA(172.101,zi,.03)=$R(100000) ; random numbers stand in for the subject,
+	. s C0XFDA(172.101,zi,.04)=$R(100000) ; predicate
+	. s C0XFDA(172.101,zi,.05)=$R(100000) ; and object pointers
+	S C0XST=$$NOW^XLFDT ; start of the insertion test
+	W !,"INSERTION STARTS AT ",C0XST,!
+	d BULKLOAD(.C0XFDA)
+	s C0XEND=$$NOW^XLFDT ; end of the insertion test
+	W !,"INSERTION ENDS AT ",C0XEND
+	S C0XDIFF=$$FMDIFF^XLFDT(C0XEND,C0XST,2)
+	W !," ELAPSED TIME: ",C0XDIFF," SECONDS"
+	I C0XDIFF>0 W !," APPROXIMATELY ",$P(100000/C0XDIFF,".")," NODES PER SECOND"
+	q
+	;
+LKY9()	;EXTRINSIC THAT RETURNS A STRING OF 9 RANDOM DIGITS. USED FOR GENERATING
+	; UNIQUE NODE AND GRAPH NAMES (UNIQUENESS IS NOT CHECKED HERE)
+	N ZN,ZI
+	S ZN=""
+	F ZI=1:1:9 D  ;
+	. S ZN=ZN_$R(10) ; APPEND ONE RANDOM DIGIT 0-9
+	Q ZN
+	;
+LKY17()	;EXTRINSIC THAT RETURNS A STRING OF 17 RANDOM DIGITS. USED FOR GENERATING
+	; UNIQUE NODE AND GRAPH NAMES (UNIQUENESS IS NOT CHECKED HERE)
+	N ZN,ZI
+	S ZN=""
+	F ZI=1:1:17 D  ;
+	. S ZN=ZN_$R(10) ; APPEND ONE RANDOM DIGIT 0-9
+	Q ZN
+	;
+BULKLOAD(ZBFDA)	; BULK LOADER FOR LOADING TRIPLES INTO FILE 172.101
+	; USING GLOBAL SETS INSTEAD OF UPDATE^DIE
+	; QUITS IF FILE IS NOT 172.101
+	; EXPECTS AN FDA WITHOUT STRINGS FOR THE IENS, STARTING AT 1
+	; NOTE: THE CODE DOES NOT VERIFY THAT THE FIRST IENS IS 1
+	; ASSUMES THAT THE LAST IENS IS THE COUNT OF ENTRIES
+	; ZBFDA IS PASSED BY REFERENCE
+	;
+	; -- reserves a block of iens from file 172.101 by locking the zero node
+	; -- ^C0X(101,0) and adding the count of entries (plus 1) to pieces 3 and 4
+	; -- then unlocking to minimize the duration of the lock
+	; -- U is not set here; presumably the caller's environment defines it as "^" - confirm
+	W !,"USING BULKLOAD"
+	I '$D(ZBFDA) Q  ; EMPTY FDA
+	I $O(ZBFDA(""))'=172.101 Q  ; WRONG FILE
+	N ZCNT,ZP3,ZP4
+	; -- find the number of nodes to insert
+	S ZCNT=$O(ZBFDA(172.101,""),-1)
+	I ZCNT="" D  Q  ;
+	. W !,"ERROR IN BULK LOAD - INVALID NODE COUNT"
+	. B
+	; -- lock the zero node and reserve a block of iens to insert
+	W !,"LOCKING ZERO NODE"
+	LOCK +^C0X(101,0)
+	S ZP3=$P(^C0X(101,0),U,3)
+	S ZP4=$P(^C0X(101,0),U,4)
+	S $P(^C0X(101,0),U,3)=ZP3+ZCNT+1
+	S $P(^C0X(101,0),U,4)=ZP4+ZCNT+1
+	LOCK -^C0X(101,0)
+	N ZI,ZN,ZG,ZS,ZP,ZO,ZIEN,ZBASE
+	S ZBASE=ZP3 ; piece 3 as it was before the reservation; new iens start at ZBASE+1
+	W !,"ZERO NODE UNLOCKED, IENS RESERVED=",ZCNT
+	W !,$$NOW^XLFDT
+	S ZI=""
+	F  S ZI=$O(ZBFDA(172.101,ZI)) Q:ZI=""  D  ;
+	. S ZN=$G(ZBFDA(172.101,ZI,.01)) ; node name
+	. I ZN="" D BLKERR Q  ; 
+	. S ZG=$G(ZBFDA(172.101,ZI,.02)) ; graph pointer
+	. I ZG="" D BLKERR Q  ; 
+	. S ZS=$G(ZBFDA(172.101,ZI,.03)) ; subject pointer
+	. I ZS="" D BLKERR Q  ; 
+	. S ZP=$G(ZBFDA(172.101,ZI,.04)) ; predicate pointer
+	. I ZP="" D BLKERR Q  ; 
+	. S ZO=$G(ZBFDA(172.101,ZI,.05)) ; object pointer
+	. I ZO="" D BLKERR Q  ; 
+	. S ZIEN=ZI+ZBASE ; the new ien
+	. S ^C0X(101,ZIEN,0)=ZN_U_ZG_U_ZS_U_ZP_U_ZO ; set the zero node
+	. S ^C0X(101,"B",ZN,ZIEN)="" ; the B index
+	. S ^C0X(101,"G",ZG,ZIEN)="" ; the G for Graph index
+	. S ^C0X(101,"SPO",ZS,ZP,ZO)="" ; the remaining indexes hold every ordering of
+	. S ^C0X(101,"SOP",ZS,ZO,ZP)="" ; subject, predicate and object, first without
+	. S ^C0X(101,"OPS",ZO,ZP,ZS)="" ; and then with the graph as leading subscript;
+	. S ^C0X(101,"OSP",ZO,ZS,ZP)="" ; none of them carries the ien
+	. S ^C0X(101,"GOPS",ZG,ZO,ZP,ZS)=""
+	. S ^C0X(101,"GOSP",ZG,ZO,ZS,ZP)=""
+	. S ^C0X(101,"GPSO",ZG,ZP,ZS,ZO)=""
+	. S ^C0X(101,"GSPO",ZG,ZS,ZP,ZO)=""
+	Q
+	;
+BLKERR	; REPORT THE FDA ENTRY ZI (SET BY BULKLOAD) THAT IS MISSING A FIELD, THEN BREAK
+	W !,"ERROR IN BULK LOAD",! ZWR ZBFDA(172.101,ZI,*)
+	B
+	Q
+	;
