# dbs/lucegene/blastxml.properties
# d.gilbert, jan 05

LIB_NAME=blastxml
title = BLAST output XML
# dmel-dvir-tblastn.xml

DATA_ROOT=web/data/blast/
INDEX_PATH=indices/lucene/blastxml/
MIME_TYPE=text/xml

## --------- search/report keys -------------------
searchfield=all
outfields=docid,queryid,Hsp_identity,Hsp_align-len,Hsp_evalue,Hsp_bit-score,url
storefields=docid,queryid,Hit_id,Hsp_identity,Hsp_evalue,Hsp_bit-score,Hsp_align-len,BlastOutput_db,url
# BlastOutput_query-def,

docurl=lookup.jsp?id=
batch.forward=lookup.jsp

## for xslt to produce the result page tables
# resultxsl = conf/blast_result.xsl
# resultspage = resultxsl.jsp

# NOTE(review): the XML markup in the header./footer. values below appears to
# have been stripped (only the \n escapes remain) -- restore it from the original file.
# header.native=\n
header.native=\n\
 \n\
 \n
footer.native=\n

batchformat = text/xml
batchformats = text/xml, text/plain, text/csv, text/tsv
title.text/xml=BLAST XML
nativeformat = text/xml

## the header./footer. values differ for native file data versus lucegene index fields
header.xml=\n
footer.xml=\n

# ---- indexing values -----------------------
# locate data with regex file, folder patterns
regex_folder=
regex_file=^.*blast.*\.xml$
regex_skipfile=
regex_skipfolder=.*
# (tmp|.*\.old)

INDEX_CLASS=org.eugenes.index.LuceneXmlIndexer
## append to existing index or create new
INDEX_APPEND=false
## index tag names as values (as well as field names)?
INDEX_TAGS=false
## index attribute values?
INDEX_ATTRIBUTES=false
## use fieldname xpath; full top.middle.last field name?
INDEX_XPATH=false
## INDEX_LEVEL=0 means index main records one level below xml tag
INDEX_LEVEL=0
INDEX_BLANKS=false

## IndexWriter opts
## merge=10 is default; 4 == less mem usage ; 2 minimum
merge_factor=6
## max_field_length is max # terms/field
max_field_length=1000000
MAX_FIELDS=50000

# to create "contents" field of all text
indexall=false

## field indexing parameters
## sumfields list needs to match field.xxx common summary fields
sumfields=docid,queryid

# special summary fields -- replace w/ fieldalias.TAG=newtag
# field.docid=ID
# field.docclass=CLA
# field.title=RETE
# field.summary=GeneSummary.SUMMARY.text

## need some recoders; want to index each as a document
# NOTE(review): the Perl snippet below appears to have lost its XML literals
# (e.g. the empty m,, pattern) -- restore them from the original file before reuse.
# \n\n";
# while(<>){
#   next if (m,^<\?xml, || m,^<\!DOCTYPE,);
#   if (m,<(BlastOutput_reference|BlastOutput_param|Iteration_stat),) { $skipto= $1; }
#   if ($skipto) {
#     $skipto='' if (m,,);
#     next;
#   }
#   print;
# }
# print "\n"; # trailer