source: fmts/trunk/p/C0XF2N.m@ 1644

Last change on this file since 1644 was 1633, checked in by George Lilly, 11 years ago

bnf enhancements

File size: 22.1 KB
Line 
1C0XF2N ; GPL - Fileman Triples entry point routine ;10/13/11 17:05
2 ;;1.0;FILEMAN TRIPLE STORE;;Sep 26, 2012;Build 11
3 ;Copyright 2011 George Lilly. Licensed under the terms of the GNU
4 ;General Public License See attached copy of the License.
5 ;
6 ;This program is free software; you can redistribute it and/or modify
7 ;it under the terms of the GNU General Public License as published by
8 ;the Free Software Foundation; either version 2 of the License, or
9 ;(at your option) any later version.
10 ;
11 ;This program is distributed in the hope that it will be useful,
12 ;but WITHOUT ANY WARRANTY; without even the implied warranty of
13 ;MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 ;GNU General Public License for more details.
15 ;
16 ;You should have received a copy of the GNU General Public License along
17 ;with this program; if not, write to the Free Software Foundation, Inc.,
18 ;51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
19 ;
20 Q
21 ;
22 ; This is based on C0XMAIN but experiments with a fast load for triples
23 ; that will write directly to the fileman global
24 ; The file 172.101 is a F2N design style for triples, which means
25 ; that it is a Flat file with no subfiles, all fields at the root
26 ; ... it is a "2" file solution which means all strings are stored in
27 ; ... strings file and pointed to by the triples file
28 ; ... it is an N file because it has generated Node IDs instead of
29 ; ... DINUM which would use the IEN for the Node ID.
30 ; gpl 11/04/2011
31 ;
32INITFARY(ZFARY) ; INITIALIZE FILE NUMBERS AND OTHER USEFUL THINGS
33 ; FOR THE DEFAULT TRIPLE STORE. USE OTHER VALUES FOR SUPPORTING ADDITIONAL
34 ; TRIPLE STORES
35 I $D(@ZFARY) Q ; ALREADY INITIALIZED
36 S @ZFARY@("C0XTFN")=172.101 ; TRIPLES FILE NUMBER
37 S @ZFARY@("C0XSFN")=172.201 ; TRIPLES STRINGS FILE NUMBER
38 S @ZFARY@("C0XTN")=$NA(^C0X(101)) ; TRIPLES GLOBAL NAME
39 S @ZFARY@("C0XSN")=$NA(^C0X(201)) ; STRING FILE GLOBAL NAME
40 S @ZFARY@("C0XDIR")="/home/glilly/fmts/trunk/samples/smart-new/"
41 S @ZFARY@("BLKLOAD")=1 ; this file supports block load
42 S @ZFARY@("FMTSSTYLE")="F2N" ; fileman style
43 S @ZFARY@("REPLYFMT")="array"
44 D USEFARY(ZFARY)
45 Q
46 ;
47USEFARY(ZFARY) ; INITIALIZES VARIABLES SAVED IN ARRAY ZFARY
48 N ZI S ZI=""
49 F S ZI=$O(@ZFARY@(ZI)) Q:ZI="" D
50 . ;N ZX
51 . S ZX="S "_ZI_"="""_@ZFARY@(ZI)_""""
52 . ;W !,ZX
53 . X ZX
54 Q
55 ;
56FILEIN ; INTERACTIVE ENTRY POINT FOR OPTION TO READ IN A FILE
57 I '$D(C0XFARY) D INITFARY("C0XFARY")
58 D USEFARY("C0XFARY")
59 S DIR(0)="F^3:240"
60 S DIR("A")="File Directory"
61 S DIR("B")=C0XDIR
62 D ^DIR
63 I Y="^" Q ;
64 S C0XDIR=Y
65 S C0XFARY("C0XDIR")=Y
66 S DIR(0)="F^3:240"
67 S DIR("A")="File Name"
68 I '$D(C0XFN) S DIR("B")="qds.rdf"
69 E S DIR("B")=C0XFN
70 D ^DIR
71 I Y="" Q ;
72 I Y="^" Q ;
73 S C0XFN=Y
74 D IMPORT(C0XFN,C0XDIR,,"C0XFARY")
75 K C0XFDA
76 Q
77 ;
78IMPORT(FNAME,INDIR,INURL,FARY) ; EXTRINSIC THAT READS A FILE FROM THE STANDARD
79 ; DIRECTORY, LOADS IT INTO THE TRIPLESTORE AS TEXT, AND RETURNS THE
80 ; NODE NAME OF THE TEXT TRIPLE
81 ; INDIR IS THE OPTIONAL DIRECTORY (DEFAUTS TO STANDARD DIR)
82 ; INURL IS THE OPTIONAL URI FOR ACCESSING THE FILE FROM THE TRIPLE STORE
83 ; FARY IS THE OPTIONAL FILE ARRAY OF THE TRIPLE STORE TO USE
84 I '$D(FARY) D ;
85 . D INITFARY("C0XFARY")
86 . S FARY="C0XFARY"
87 D USEFARY(FARY)
88 N ZD,ZTMP
89 I '$D(INDIR) S INDIR=C0XDIR ; DIRECTORY OF THE RDF FILE
90 I $G(INURL)="" D ;
91 . ;N ZN2 S ZN2=$P(FNAME,".",1)_"_"_$P(FNAME,".",2) ; REMOVE THE DOT
92 . ;S INURL=FDIR_ZN2
93 . S INURL=INDIR_FNAME
94 N ZTMP
95 S ZTMP=$NA(^TMP("C0X",$J,"FILEIN",1)) ; WHERE TO PUT THE INCOMING FILE
96 K @ZTMP ; MAKE SURE IT'S CLEAR
97 S C0XSTART=$$NOW^XLFDT
98 W !,"STARTED: ",C0XSTART
99 W !,"READING IN: ",FNAME
100 I '$$FILEREAD(ZTMP,INDIR,FNAME,4) D Q ; QUIT IF NO SUCCESS
101 . W !,"ERROR READING FILE: ",INDIR,FNAME
102 S ZRDF=$NA(^TMP("C0X",$J,"FILEIN")) ; WITHOUT THE SUBSCRIPT
103 W !,$O(@ZRDF@(""),-1)," LINES READ"
104 D INSRDF(ZRDF,INURL,FARY) ; IMPORT AND PROCESS THE RDF
105 K INURL
106 K C0XFDA
107 ;K ^TMP("MXMLDOM",$J)
108 Q
109 ;
110WGET(ZURL,FARY) ; GET FROM THE INTERNET AN RDF FILE AND INSERT IT
111 ;
112 I '$D(FARY) D ;
113 . D INITFARY("C0XFARY")
114 . S FARY="C0XFARY"
115 D USEFARY(FARY)
116 ;N ZLOC,ZTMP
117 K ZTMP
118 S ZLOC=$NA(^TMP("C0X","WGET",$J))
119 K @ZLOC
120 S C0XSTART=$$NOW^XLFDT
121 W !,"STARTED: ",C0XSTART
122 W !,"DOWNLOADING: ",ZURL
123 S OK=$$httpGET^%zewdGTM(ZURL,.ZTMP)
124 M @ZLOC=ZTMP
125 S C0XLINES=$O(@ZLOC@(""),-1)
126 W !,C0XLINES," LINES READ"
127 S C0XDLC=$$NOW^XLFDT ; DOWNLOAD COMPLETE
128 W !,"DOWNLOAD COMPLETE AT ",C0XDLC
129 S C0XDIFF=$$FMDIFF^XLFDT(C0XDLC,C0XSTART,2)
130 W !," ELAPSED TIME: ",C0XDIFF," SECONDS"
131 I C0XDIFF'=0 W !," APPROXIMATELY ",$P(C0XLINES/C0XDIFF,".")," LINES PER SEC"
132 D INSRDF(ZLOC,ZURL,FARY)
133 Q
134 ;
135INSRDF(ZRDF,ZNAME,FARY) ; INSERT AN RDF FILE INTO THE STORE AND PROCESS
136 ; ZRDF IS PASSED BY NAME
137 I '$D(FARY) D ;
138 . D INITFARY("C0XFARY")
139 . S FARY="C0XFARY"
140 D USEFARY(FARY)
141 S BATCNT=0 ; BATCH COUNTER
142 S BATMAX=10000 ; TRY BATCHES OF THIS SIZE
143 N ZGRAPH,ZSUBJECT
144 S ZGRAPH="_:G"_$$LKY9 ; RANDOM GRAPH NAME
145 S ZSUBJECT=$$ANONS() ; RANDOM ANOYMOUS SUBJECT
146 D ADD(ZGRAPH,ZSUBJECT,"fmts:url",ZNAME,FARY)
147 N ZTXTNM
148 S ZTXTNM="_TXT_INCOMING_RDF_FILE_"_ZNAME_"_"_$$LKY9 ; NAME FOR TEXT NODE
149 D ADD(ZGRAPH,ZSUBJECT,"fmts:fileSource",ZTXTNM,FARY)
150 D ADD(ZGRAPH,ZSUBJECT,"fmts:fileTag",$$name2tag(ZNAME),FARY)
151 D SWUPDIE(.C0XFDA) ; TRY IT OUT
152 K C0XCNT ;RESET FOR NEXT TIME
153 D STORETXT(ZRDF,ZTXTNM,FARY)
154 W !,"ADDED: ",ZGRAPH," ",ZSUBJECT," fmts:fileSource ",ZTXTNM
155 D PROCESS(.G,ZRDF,ZNAME,ZGRAPH,FARY) ; PARSE AND INSERT THE RDF
156 Q
157 ;
158name2tag(zname) ; extrinsic which returns a tag derived from a name
159 ; /home/vista/project.xml ==> project
160 q $p($re($p($re(zname),"/")),".")
161 ;
162STORETXT(ZTXT,ZNAME,FARY) ; STORE TEXT IN THE TRIPLESTORE AT ZNAME
163 ;
164 I '$D(FARY) D ;
165 . D INITFARY("C0XFARY")
166 . S FARY="C0XFARY"
167 D USEFARY(FARY)
168 N ZIEN
169 S ZIEN=$$IENOF(ZNAME,FARY) ; GET THE IEN
170 D CLEAN^DILF
171 K ZERR
172 D WP^DIE(C0XSFN,ZIEN_",",1,,ZTXT,"ZERR")
173 I $D(ZERR) D Q ;
174 . W !,"ERROR CREATING WORD PROCESSING FIELD"
175 . S C0XERR="ERROR CREATING WORD PROCESSING FIELD"
176 . D ^%ZTER ; error trap
177 Q
178 ;
179GETTXT(ZRTN,ZNAME,FARY) ; RETURNS RDF SOURCE OR OTHER TEXT
180 ; ZRTN IS PASSED BY REFERENCE
181 I '$D(FARY) D ;
182 . D INITFARY("C0XFARY")
183 . S FARY="C0XFARY"
184 D USEFARY(FARY)
185 N ZIEN
186 S ZIEN=$$IENOF(ZNAME)
187 S OK=$$GET1^DIQ(C0XSFN,ZIEN_",",1,,"ZRTN")
188 Q
189 ;
190WHERETXT(ZNAME,FARY) ; EXTRINSIC WHICH RETURNS THE NAME OF THE GLOBAL
191 ; WHERE THE TEXT IS LOCATED. NAME IS THE NAME OF THE STRING
192 I '$D(FARY) D ;
193 . D INITFARY("C0XFARY")
194 . S FARY="C0XFARY"
195 D USEFARY(FARY)
196 N ZIEN
197 S ZIEN=$$IENOF(ZNAME)
198 Q $NA(@C0XSN@(ZIEN,1))
199 ;
200FILEREAD(ZINTMP,ZDIR,ZFNAME,ZLVL) ; READS A FILE INTO ZINTMP USING FTG^%ZISH
201 ; ZINTMP IS PASSED BY NAME AND INCLUDES THE NEW SUBSCRIPT
202 ; IE ^TMP("C0X","FILEIN",1)
203 ; ZLVL IN THIS CASE WOULD BE 3 INCREMENTING THE 1
204 ; EXTRINSIC WHICH RETURNS THE RESULT OF FTG^%ZISH
205 S OK=$$FTG^%ZISH(ZDIR,FNAME,ZINTMP,ZLVL)
206 Q OK
207 ;
208TESTPROC ; TEST PROCESS WITH EXISTING SMALL RDF FILE
209 S ZIN=$NA(^TMP("C0X",12226,"FILEIN"))
210 S ZGRAPH="/test/rdfFile"
211 S ZM="/test/rdfFile/meta"
212 D PROCESS(.G,ZIN,ZGRAPH,ZM)
213 Q
214 ;
215VISTAOWL ;
216 S ZRDF=$NA(^TMP("C0X",542,"FILEIN"))
217 S ZNAME="/home/glilly/vistaowl/VistAOWL.owl"
218 S ZGRAPH="_:G431590209"
219 S FARY="C0XFARY"
220 D INITFARY(FARY)
221 S C0XDOCID=1
222 S BATCNT=0
223 S BATMAX=10000
224 D PROCESS(.G,ZRDF,ZGRAPH,ZNAME,FARY)
225 Q
226 ;
227PROCESS(ZRTN,ZRDF,ZGRF,ZMETA,FARY) ; PROCESS AN INCOMING RDF FILE
228 ; ZRTN IS PASS BY REFERENCE AND RETURNS MESSAGES ABOUT THE PROCESSING
229 ; ZRDF IS PASSED BY NAME AND IS THE GLOBAL CONTAINING THE RDF FILE
230 ; ZGRF IS THE NAME OF THE GRAPH TO USE IN THE TRIPLE STORE FOR RESULTS
231 ; ZMETA IS OPTIONAL AND IS THE NAME OF THE GRAPH TO STORE METADATA
232 ;
233 I '$D(FARY) D ;
234 . D INITFARY("C0XFARY")
235 . S FARY="C0XFARY"
236 D USEFARY(FARY)
237 ;N BATCNT
238 ;N BATMAX
239 ; -- first parse the rdf file with the MXML parser
240 ;S C0XDOCID=$$PARSE^C0CNHIN(ZRDF,"C0XARRAY") ; PARSE WITH MXML
241 S C0XDLC2=$$NOW^XLFDT ; START OF PARSE
242 I @ZRDF@(1)'["<?xml" D Q ;
243 . K @ZRDF ; don't need the input buffer
244 . W !,"Not an XML file"
245 N ZZI S ZZI=""
246 F S ZZI=$O(@ZRDF@(ZZI)) Q:ZZI="" D ;
247 . N ZZX S ZZX=@ZRDF@(ZZI)
248 . I ZZX["Name >" S ZZX=$P(ZZX,"Name >",1)_"Name>"_$P(ZZX,"Name >",2)
249 . I ZZX["Device >" S ZZX=$P(ZZX,"Device >",1)_"Device>"_$P(ZZX,"Device >",2)
250 . S @ZRDF@(ZZI)=ZZX
251 S C0XDOCID=$$EN^MXMLDOM(ZRDF,"W") ;
252 ;B
253 K @ZRDF ; DON'T NEED INPUT BUFFER ANYMORE
254 ; -- assign the MXLM dom global name to ZDOM
255 S ZDOM=$NA(^TMP("MXMLDOM",$J,C0XDOCID))
256 ;S ZDOM=$NA(^TMP("MXMLDOM",16850,C0XDOCID)) ;VISTAOWL DOM
257 S C0XNODE=$O(@ZDOM@(""),-1)
258 W !,C0XNODE," XML NODES PARSED"
259 S C0XPRS=$$NOW^XLFDT ; PARSE COMPLETE
260 W !,"PARSE COMPLETE AT ",C0XPRS
261 S C0XDIFF=$$FMDIFF^XLFDT(C0XPRS,C0XDLC2,2)
262 W !," ELAPSED TIME: ",C0XDIFF," SECONDS"
263 I C0XDIFF'=0 D ;
264 . W !," APPROXIMATELY ",$P(C0XNODE/C0XDIFF,".")," NODES PER SECOND"
265 ; -- populate the metagraph to point to the graph with status unfinished
266 S METAS=$$ANONS ; GET AN ANONOMOUS RANDOM SUBJECT
267 I '$D(ZMETA) S ZMETA="_:G"_$$LKY9 ; RANDOM GRAPH NAME FOR METAGRAPH
268 D ADD(ZMETA,METAS,"fmts:about",ZGRF,FARY) ; POINT THE META TO THE GRAPH
269 D ADD(ZMETA,METAS,"fmts:status","unfinished",FARY) ; mark as unfinished
270 W !,"INSERTING GRAPH: ",ZGRF
271 ;S C0XDATE=$$FMDTOUTC^C0CUTIL($$NOW^XLFDT,"DT")
272 S C0XDATE=$$NOW^XLFDT
273 D ADD(ZMETA,METAS,"fmts:dateTime",C0XDATE,FARY)
274 D SWUPDIE(.C0XFDA) ; commit the metagraph changes to the triple store
275 ; --
276 ; -- pull out the vocabularies in the RDF statement. marked with xmlns:
277 ; -- put them in a local variable for quick reference
278 ; -- TODO: create a graph for vocabularies and validate incoming against it
279 ;
280 S C0XVOC=""
281 N ZI,ZJ,ZK S ZI=""
282 F S ZI=$O(@ZDOM@(1,"A",ZI)) Q:ZI="" D ; FOR EACH xmlns
283 . S ZVOC=$P(ZI,"xmlns:",2)
284 . I ZVOC'="" S C0XVOC(ZVOC)=$G(@ZDOM@(1,"A",ZI))
285 I $D(DEBUG) D ;
286 . W !,"VOCABS:"
287 . N ZZ S ZZ=""
288 . F S ZZ=$O(C0XVOC(ZZ)) Q:ZZ="" W !,ZZ,":",C0XVOC(ZZ)
289 ;
290 ; -- look for children called rdf:Description. quit if none. not an rdf file
291 ;
292 S C0XTYPE("rdf:Description")=1
293 S C0XTYPE("owl:ObjectProperty")=1
294 S C0XTYPE("owl:Ontology")=1
295 S C0XTYPE("owl:Class")=1
296 S C0XTYPE("rdfs:subClassOf")=1
297 S C0XTYPE("rdf:RDF")=1
298 S ZI=$O(@ZDOM@(1,"C",""))
299 I '$G(C0XTYPE(@ZDOM@(1,"C",ZI))) D ;Q ; not an rdf file
300 . W !,"Unusual RDF file ",@ZDOM@(1,"C",ZI)
301 . ;W !,"Error. Not an RDF file. Cannot process."
302 . D SHOW(1)
303 ;
304 ; -- now process the rdf description children
305 ;
306 S ZI=""
307 S (C0XSUB,C0XPRE,C0XOBJ)="" ; INITIALIZE subject, object and predicate
308 F S ZI=$O(@ZDOM@(1,"C",ZI)) Q:ZI="" D ;
309 . ; -- we are skipping any child that is not rdf:Description
310 . ; -- TODO: check to see if this is right in general
311 . ;
312 . IF '$G(C0XTYPE(@ZDOM@(1,"C",ZI))) D Q ;
313 . . W !,"SKIPPING NODE: ",ZI
314 . ; -- now looking for the subject for the triples
315 . S ZX=$G(@ZDOM@(ZI,"A","rdf:about"))
316 . I ZX'="" D ; we have the subject
317 . . ;W " about: ",ZX
318 . . S C0XSUB=ZX
319 . E D ;
320 . . S ZX=$G(@ZDOM@(ZI,"A","rdf:nodeID")) ; node id is another style of subject
321 . . I ZX'="" D ;
322 . . . S C0XSUB=ZX
323 . I C0XSUB="" S C0XSUB=$$ANONS ; DEFAULT TO BLANK SUBJECT
324 . ;
325 . ; -- we now have the subject. the children of this node have the rest
326 . ;
327 . S ZJ="" ; for the children of the rdf:Description nodes
328 . F S ZJ=$O(@ZDOM@(ZI,"C",ZJ)) Q:ZJ="" D ; for each child
329 . . S C0XPRE=@ZDOM@(ZJ) ; the predicate without a prefix
330 . . S ZX=$G(@ZDOM@(ZJ,"A","xmlns")) ; name space
331 . . I ZX'="" S C0XPRE=ZX_C0XPRE ; add the namespace prefix
332 . . I C0XPRE[":" D ; expand using vocabulary
333 . . . N ZB,ZA
334 . . . S ZB=$P(C0XPRE,":",1)
335 . . . S ZA=$P(C0XPRE,":",2)
336 . . . I $G(C0XVOC(ZB))'="" D ;
337 . . . . S C0XPRE=C0XVOC(ZB)_ZA ; expanded
338 . . S ZY=$G(@ZDOM@(ZJ,"A","rdf:resource")) ; potential object
339 . . I ZY'="" D Q ;
340 . . . S C0XOBJ=$$EXT^C0XUTIL(ZY) ; object
341 . . . D ADD(ZGRF,C0XSUB,C0XPRE,C0XOBJ) ; finally. our first real triple
342 . . ; -- this is an else because of the quit above
343 . . S ZX=$G(@ZDOM@(ZJ,"A","rdf:nodeID")) ; fishing for nodeId object
344 . . I ZX'="" D Q ; got one
345 . . . S C0XOBJ=ZX ; we are using the incoming nodeIDs as object/subject
346 . . . ; without change... this could be foolish .. look at it again later
347 . . . D ADD(ZGRF,C0XSUB,C0XPRE,C0XOBJ) ; go for it and add a node
348 . . S C0XOBJ=$G(@ZDOM@(ZJ,"T",1)) ; hopefully an object is here
349 . . I C0XOBJ="" D Q ; not a happy situation
350 . . . W !,"ERROR, NO OBJECT FOUND FOR NODE: ",ZJ
351 . . S C0XOBJ=$$EXT^C0XUTIL(C0XOBJ) ; might be namespaced
352 . . D ADD(ZGRF,C0XSUB,C0XPRE,C0XOBJ) ; go for it and add a node
353 S C0XTRP=$$NOW^XLFDT ; PARSE COMPLETE
354 W !,"TRIPLES COMPLETE AT ",C0XTRP
355 S C0XDIFF=$$FMDIFF^XLFDT(C0XTRP,C0XPRS,2)
356 W !," ELAPSED TIME: ",C0XDIFF," SECONDS"
357 I C0XDIFF'=0 D ;
358 . W !," APPROXIMATELY ",$P(C0XCNT/C0XDIFF,".")," TRIPLES PER SECOND"
359 W !,"INSERTING ",C0XCNT," TRIPLES"
360 I $D(C0XFDA) D ;
361 . I $G(BLKLOAD) D ;
362 . . D BULKLOAD(.C0XFDA)
363 . E D ;
364 . . D UPDIE(.C0XFDA) ; commit the updates to the file
365 ; next, mark the graph as finished
366 S C0XINS=$$NOW^XLFDT ; PARSE COMPLETE
367 W !,"INSERTION COMPLETE AT ",C0XPRS
368 S C0XDIFF=$$FMDIFF^XLFDT(C0XINS,C0XTRP,2)
369 W !," ELAPSED TIME: ",C0XDIFF," SECONDS"
370 I C0XDIFF'=0 W !," APPROXIMATELY ",$P(C0XCNT/C0XDIFF,".")," NODES PER SECOND"
371 S C0XEND=$$NOW^XLFDT
372 W !," ENDED AT: ",C0XEND
373 S C0XDIFF=$$FMDIFF^XLFDT(C0XEND,C0XSTART,2)
374 W !," ELAPSED TIME: ",C0XDIFF," SECONDS"
375 I C0XDIFF'=0 W !," APPROXIMATELY ",$P(C0XCNT/C0XDIFF,".")," TRIPLES PER SECOND"
376 Q
377 ;
378SHOW(ZN) ;
379 I '$D(C0XJOB) S C0XJOB=$J
380 N ZD
381 S ZD=$NA(^TMP("MXMLDOM",C0XJOB,1,ZN))
382 W ZD,"=",@ZD
383 F S ZD=$Q(@ZD) Q:$QS(ZD,4)'=ZN W !,ZD,"=",@ZD
384 ;ZWR ^TMP("MXMLDOM",C0XJOB,1,ZN,*)
385 Q
386 ;
387ANONS() ; RETURNS AN ANONOMOUS SUBJECT
388 Q "iDPsDPss"_$$LKY9
389 ;
390NEWG(NGRAPH,NMETA) ; CREATES A NEW META GRAPH, MARKS IT AS UNFINISHED
391 ; THEN CREATES A NEW GRAPH AND POINTS THE METAGRAPH TO IT
392 ; NGRAPH AND NMETA ARE PASSED BY REFERENCE AND ARE THE RETURN
393 S NGRAPH="G"_$$LKY9
394 S NMETA=NGRAPH_"A"
395 Q
396 ;
397STARTADD ; INITIALIZE C0XFDA AND BATCNT
398 K C0XFDA
399 K BATCNT
400 Q
401 ;
402ADD(ZG,ZS,ZP,ZO,FARY) ; ADD A TRIPLE TO THE TRIPLESTORE. ALL VALUES ARE TEXT
403 ; THE FDA IS SET UP BUT THE FILES ARE NOT UPDATED. CALL UPDIE TO COMPLETE
404 I '$D(FARY) D ;
405 . D INITFARY("C0XFARY")
406 . S FARY="C0XFARY"
407 D USEFARY(FARY)
408 I '$D(C0XCNT) S C0XCNT=0
409 N ZNODE
410 S ZNODE="N"_$$LKY17
411 N ZNARY ; GET READY TO CALL IENOFA
412 I (ZG="")!(ZS="")!(ZP="")!(ZO="") D Q ;
413 . I $G(DEBUG) W !,"Error Empty String ZG:"_ZG_" ZS:"_ZS_" ZP:"_ZP_" ZO"_ZO
414 S ZNARY("ZG",ZG)=""
415 S ZNARY("ZS",ZS)=""
416 S ZNARY("ZP",ZP)=""
417 S ZNARY("ZO",ZO)=""
418 D IENOFA(.ZIENS,.ZNARY,FARY) ; RESOLVE/ADD STRINGS
419 ;S ZGIEN=$$IENOF(ZG) ; LAYGO TO GET IEN
420 ;S ZSIEN=$$IENOF(ZS)
421 ;S ZPIEN=$$IENOF(ZP)
422 ;S ZOIEN=$$IENOF(ZO)
423 ;I $D(C0XFDA) D UPDIE ; ADD THE STRINGS IF NEEDED
424 I '$D(BATCNT) S BATCNT=0
425 S BATCNT=BATCNT+1
426 S C0XCNT=C0XCNT+1
427 I $G(BLKLOAD)=1 D ; we are using bulk load
428 . S C0XFDA(C0XTFN,BATCNT,.01)=ZNODE
429 . S C0XFDA(C0XTFN,BATCNT,.02)=$O(ZIENS("IEN","ZG",""))
430 . S C0XFDA(C0XTFN,BATCNT,.03)=$O(ZIENS("IEN","ZS",""))
431 . S C0XFDA(C0XTFN,BATCNT,.04)=$O(ZIENS("IEN","ZP",""))
432 . S C0XFDA(C0XTFN,BATCNT,.05)=$O(ZIENS("IEN","ZO",""))
433 E D ;
434 . S C0XFDA(C0XTFN,"?+"_BATCNT_",",.01)=ZNODE
435 . S C0XFDA(C0XTFN,"?+"_BATCNT_",",.02)=$O(ZIENS("IEN","ZG",""))
436 . S C0XFDA(C0XTFN,"?+"_BATCNT_",",.03)=$O(ZIENS("IEN","ZS",""))
437 . S C0XFDA(C0XTFN,"?+"_BATCNT_",",.04)=$O(ZIENS("IEN","ZP",""))
438 . S C0XFDA(C0XTFN,"?+"_BATCNT_",",.05)=$O(ZIENS("IEN","ZO",""))
439 I '$D(BATMAX) S BATMAX=10000
440 I BATCNT=BATMAX D ; BATCH IS DONE
441 . I $G(BLKLOAD) D ; bulk load
442 . . D BULKLOAD(.C0XFDA) ; bulk load the batch
443 . E D ; no bulk load
444 . . D UPDIE(.C0XFDA)
445 . K C0XFDA
446 . S BATCNT=0 ; RESET COUNTER
447 ; REMEMBER TO CALL UPDIE WHEN YOU'RE DONE
448 Q
449 ;
450LKY5() ;EXTRINIC THAT RETURNS A RANDOM 5 DIGIT NUMBER. USED FOR GENERATING
451 ; UNIQUE NODE AND GRAPH NAMES
452 N ZN,ZI
453 S ZN=""
454 F ZI=1:1:5 D ;
455 . S ZN=ZN_$R(10)
456 Q ZN
457 ;
458LKY9() ;EXTRINIC THAT RETURNS A RANDOM 9 DIGIT NUMBER. USED FOR GENERATING
459 ; UNIQUE NODE AND GRAPH NAMES
460 N ZN,ZI
461 S ZN=""
462 F ZI=1:1:9 D ;
463 . S ZN=ZN_$R(10)
464 Q ZN
465 ;
466LKY17() ;EXTRINIC THAT RETURNS A RANDOM 9 DIGIT NUMBER. USED FOR GENERATING
467 ; UNIQUE NODE AND GRAPH NAMES
468 N ZN,ZI
469 S ZN=""
470 F ZI=1:1:17 D ;
471 . S ZN=ZN_$R(10)
472 Q ZN
473 ;
474 ; these routines add the string if it is not found
475 ;
476IENOF(ZSTRING,FARY) ; EXTRINSIC WHICH RETURNS THE IEN OF ZS IN THE STRINGS FILE
477 I '$D(FARY) D ;
478 . D INITFARY("C0XFARY")
479 . S FARY="C0XFARY"
480 N ZIEN
481 I $G(ZSTRING)="" Q "" ; NO STRING
482 S ZIEN=$O(@C0XSN@("B",ZSTRING,""))
483 I ZIEN="" D ;
484 . S C0XFDA2(C0XSFN,"+1,",.01)=ZSTRING
485 . D UPDIE(.C0XFDA2)
486 . S ZIEN=$O(@C0XSN@("B",ZSTRING,""))
487 . K C0XFDA2
488 Q ZIEN
489 ;
490IENOFA(ZOUTARY,INARY,FARY) ; RESOLVE STRINGS TO IEN IN STRINGS FILE
491 ; OR ADD THEM IF
492 ; MISSING. ZINARY AND ZOUTARY ARE PASSED BY REFERENCE
493 ; ZINARY LOOKS LIKE ZINARY("VAR","VAL")=""
494 ; RETURNS IN ZOUTARY OF THE FORM ZOUTARY("IEN","VAR",IEN)=""
495 I '$D(FARY) D ;
496 . D INITFARY("C0XFARY")
497 . S FARY="C0XFARY"
498 K ZOUTARY ; START WITH CLEAN RESULTS
499 K C0XFDA2 ; USE A SEPARATE FDA FOR THIS
500 I '$D(C0XVOC) D VOCINIT^C0XUTIL
501 N ZINARY
502 N ZI S ZI=""
503 F S ZI=$O(INARY(ZI)) Q:ZI="" D ;
504 . N ZK
505 . S ZK=$O(INARY(ZI,""))
506 . S ZINARY($$EXT^C0XUTIL(ZI),$$EXT^C0XUTIL(ZK))=""
507 N ZV,ZIEN,ABORT
508 S ABORT=0
509 N ZCNT S ZCNT=0
510 F S ZI=$O(ZINARY(ZI)) Q:(ZI="")!+ABORT D ; LOOK FOR MISSING STRINGS
511 . S ZV=$O(ZINARY(ZI,""))
512 . I ZV="" S ABORT=1 Q ; abandon quad -- missing an entry
513 . I ZV["^" S ZV=$TR(ZV,"^","|")
514 . I $O(@C0XSN@("B",ZV,""))="" D ;
515 . . S ZCNT=ZCNT+1
516 . . S C0XFDA2(C0XSFN,"+"_ZCNT_",",.01)=ZV
517 I +ABORT Q ;
518 I $D(C0XFDA2) D ;
519 . D UPDIE(.C0XFDA2) ; ADD MISSING STRINGS
520 . K C0XFDA2 ; CLEAN UP
521 F S ZI=$O(ZINARY(ZI)) Q:ZI="" D ; NOW GET ALL IENS
522 . S ZV=$O(ZINARY(ZI,""))
523 . I ZV["^" S ZV=$TR(ZV,"^","|")
524 . S ZIEN=$O(@C0XSN@("B",ZV,"")) ; THEY SHOULD BE THERE NOW
525 . I ZIEN="" D ;
526 . . W !,"ERROR ADDING STRING: ",ZV
527 . . B
528 . S ZOUTARY("IEN",ZI,ZIEN)=""
529 Q
530 ;
531ADDINN(ZG,ZS,ZARY) ; ADD IF NOT NULL
532 ; ZG IS THE GRAPH NAME, PASSED BY VALUE
533 ; ZS IS THE SUBJECT, PASSED BY VALUE
534 ; ZARY IS AN ARRAY, PASSED BY REFERENCE OF THE PREDICATE AND OBJECT
535 ; FORMAT IS ZARY(PRED)=OBJ
536 N ZI S ZI=""
537 F S ZI=$O(ZARY(ZI)) Q:ZI="" D ;
538 . ;I ZARY(ZI)="" S ZARY(ZI)="NULL"
539 . I ZARY(ZI)'="" D ;
540 . . D ADD^C0XF2N(ZG,ZS,ZI,ZARY(ZI))
541 . . I $D(DEBUG) W !,"ADDING",ZI," ",ZARY(ZI)
542 ;ZWR ZARY
543 Q
544 ;
545BULKLOAD(ZBFDA) ; BULK LOADER FOR LOADING TRIPLES INTO FILE 172.101
546 ; USING GLOBAL SETS INSTEAD OF UPDATE^DIE
547 ; QUITS IF FILE IS NOT 172.101
548 ; EXPECTS AN FDA WITHOUT STRINGS FOR THE IENS, STARTING AT 1
549 ; QUITS IF FIRST ENTRY IS NOT IENS 1
550 ; ASSUMES THAT THE LAST IENS IS THE COUNT OF ENTRIES
551 ; ZBFDA IS PASSED BY REFERENCE
552 ;
553 ; -- reserves a block of iens from file 172.101 by locking the zero node
554 ; -- ^C0X(101,0) and adding the count of entries to piece 2 and 3
555 ; -- then unlocking to minimize the duration of the lock
556 ;
557 I $D(DEBUG) W !,"USING BULKLOAD"
558 I '$D(ZBFDA) Q ; EMPTY FDA
559 I $O(ZBFDA(""))'=172.101 Q ; WRONG FILE
560 N ZCNT,ZP3,ZP4
561 ; -- find the number of nodes to insert
562 S ZCNT=$O(ZBFDA(172.101,""),-1)
563 I ZCNT="" D Q ;
564 . W !,"ERROR IN BULK LOAD - INVALID NODE COUNT"
565 . B
566 ; -- lock the zero node and reserve a block of iens to insert
567 I $D(DEBUG) W !,"LOCKING ZERO NODE"
568 LOCK +^C0X(101,0)
569 S ZP3=$P(^C0X(101,0),U,3)
570 S ZP4=$P(^C0X(101,0),U,4)
571 S $P(^C0X(101,0),U,3)=ZP3+ZCNT+1
572 S $P(^C0X(101,0),U,4)=ZP4+ZCNT+1
573 LOCK -^C0X(101,0)
574 N ZI,ZN,ZG,ZS,ZP,ZO,ZIEN,ZBASE
575 S ZBASE=ZP3 ; the last ien in the file
576 I $D(DEBUG) W !,"ZERO NODE UNLOCKED, IENS RESERVED=",ZCNT
577 I $D(DEBUG) W !,$$NOW^XLFDT
578 S ZI=""
579 F S ZI=$O(ZBFDA(172.101,ZI)) Q:ZI="" D ;
580 . S ZN=$G(ZBFDA(172.101,ZI,.01)) ; node name
581 . I ZN="" D BLKERR Q ;
582 . S ZG=$G(ZBFDA(172.101,ZI,.02)) ; graph pointer
583 . I ZG="" D BLKERR Q ;
584 . S ZS=$G(ZBFDA(172.101,ZI,.03)) ; subject pointer
585 . I ZS="" D BLKERR Q ;
586 . S ZP=$G(ZBFDA(172.101,ZI,.04)) ; predicate pointer
587 . I ZP="" D BLKERR Q ;
588 . S ZO=$G(ZBFDA(172.101,ZI,.05)) ; object pointer
589 . I ZO="" D BLKERR Q ;
590 . S ZIEN=ZI+ZBASE ; the new ien
591 . S ^C0X(101,ZIEN,0)=ZN_U_ZG_U_ZS_U_ZP_U_ZO ; set the zero node
592 . D INDEX(ZIEN,ZN,ZG,ZS,ZP,ZO)
593 Q
594 ;
595INDEX(ZIEN,ZN,ZG,ZS,ZP,ZO) ; HARD SET THE INDEX FOR ONE ENTRY
596 S ^C0X(101,"B",ZN,ZIEN)="" ; the B index
597 S ^C0X(101,"G",ZG,ZIEN)="" ; the G for Graph index
598 S ^C0X(101,"SPO",ZS,ZP,ZO,ZIEN)=""
599 S ^C0X(101,"SOP",ZS,ZO,ZP,ZIEN)=""
600 S ^C0X(101,"OPS",ZO,ZP,ZS,ZIEN)=""
601 S ^C0X(101,"OSP",ZO,ZS,ZP,ZIEN)=""
602 S ^C0X(101,"PSO",ZP,ZS,ZO,ZIEN)=""
603 S ^C0X(101,"POS",ZP,ZO,ZS,ZIEN)=""
604 ;S ^C0X(101,"GOPS",ZG,ZO,ZP,ZS,ZIEN)=""
605 ;S ^C0X(101,"GOSP",ZG,ZO,ZS,ZP,ZIEN)=""
606 ;S ^C0X(101,"GPSO",ZG,ZP,ZS,ZO,ZIEN)=""
607 ;S ^C0X(101,"GPOS",ZG,ZP,ZO,ZS,ZIEN)=""
608 ;S ^C0X(101,"GSPO",ZG,ZS,ZP,ZO,ZIEN)=""
609 ;S ^C0X(101,"GSOP",ZG,ZS,ZO,ZP,ZIEN)=""
610 Q
611 ;
612REINDEX ; REINDEX THE ^C0X(101, TRIPLE STORE
613 K ^C0X(101,"B")
614 K ^C0X(101,"G")
615 K ^C0X(101,"SPO")
616 K ^C0X(101,"SOP")
617 K ^C0X(101,"OPS")
618 K ^C0X(101,"OSP")
619 K ^C0X(101,"PSO")
620 K ^C0X(101,"POS")
621 K ^C0X(101,"GOPS")
622 K ^C0X(101,"GOSP")
623 K ^C0X(101,"GPSO")
624 K ^C0X(101,"GPOS")
625 K ^C0X(101,"GSPO")
626 K ^C0X(101,"GSOP")
627 N ZIEN,ZZ
628 S ZIEN=0
629 F S ZIEN=$O(^C0X(101,ZIEN)) Q:+ZIEN=0 D ; FOR EACH NODE
630 . S ZZ=$G(^C0X(101,ZIEN,0))
631 . I ZZ="" D Q ;
632 . . W !,"ERROR REINDEXING NODE ",ZI
633 . S ZN=$P(ZZ,"^",1)
634 . S ZG=$P(ZZ,"^",2)
635 . S ZS=$P(ZZ,"^",3)
636 . S ZP=$P(ZZ,"^",4)
637 . S ZO=$P(ZZ,"^",5)
638 . D INDEX(ZIEN,ZN,ZG,ZS,ZP,ZO)
639 Q
640 ;
641BLKERR ;
642 W !,"ERROR IN BULK LOAD"
643 S C0XERR="ERROR IN BULK LOAD"
644 S C0XLOC=ZBFDA(ZI)
645 D ^%ZTER ; report the error
646 B
647 Q
648 ;
649DELGRAPH(ZGRF,FARY) ; delete a graph from the triplestore
650 ; (doesn't delete strings)
651 ;
652 I '$D(FARY) D ;
653 . D INITFARY("C0XFARY")
654 . S FARY="C0XFARY"
655 D USEFARY(FARY)
656 N ZGRAPH
657 D TING(.ZGRAPH,ZGRF,FARY)
658 I '$D(ZGRAPH) D Q ;
659 . I $D(DEBUG) W !,"NO TRIPLES IN GRAPH"
660 K C0XFDA
661 N ZI S ZI=""
662 F S ZI=$O(ZGRAPH(ZI)) Q:ZI="" D ;
663 . S C0XFDA(C0XTFN,ZI_",",.01)="@"
664 D UPDIE(.C0XFDA)
665 Q
666 ;
667TING(ZRTN,ZGRF,FARY) ; return the iens for graph ZGRF
668 ; ZRTN is passed by reference
669 I '$D(FARY) D ;
670 . D INITFARY("C0XFARY")
671 . S FARY="C0XFARY"
672 D USEFARY(FARY)
673 K ZRTN
674 N ZI,ZG S ZI=""
675 S ZG=$$IENOF^C0XGET1(ZGRF)
676 I ZG="" D Q ;
677 . I $D(DEBUG) W !,"ERROR GRAPH NOT FOUND"
678 I '$D(@C0XTN@("G",ZG)) Q ;
679 F S ZI=$O(@C0XTN@("G",ZG,ZI)) Q:ZI="" D ;
680 . S ZRTN(ZI)=""
681 Q
682 ;
683SWUPDIE(ZFDA) ; SWITCH BETWEEN UPDIE AND BULKLOAD
684 I $G(BLKLOAD)=1 D ; bulk load
685 . D BULKLOAD(.ZFDA) ; bulk load the batch
686 E D ; no bulk load
687 . D UPDIE(.ZFDA)
688 K ZFDA
689 Q
690 ;
691UPDIE(ZFDA) ; INTERNAL ROUTINE TO CALL UPDATE^DIE AND CHECK FOR ERRORS
692 ; ZFDA IS PASSED BY REFERENCE
693 ;ZWR ZFDA
694 ;B
695 K ZERR
696 D CLEAN^DILF
697 D UPDATE^DIE("","ZFDA","","ZERR")
698 I $D(ZERR) S ZZERR=ZZERR ; ZZERR DOESN'T EXIST,
699 ; INVOKE THE ERROR TRAP IF TASKED
700 ;. W "ERROR",!
701 ;. ZWR ZERR
702 ;. B
703 K ZFDA
704 Q
705 ;
Note: See TracBrowser for help on using the repository browser.