# gnomap.properties # for dmel het fff/gnomap feature data LIB_NAME=gnomap title = FlyBase Genome Feaures # leave these to command line args? DATA_ROOT=web/data/genomes/Drosophila_melanogaster/current/fff/ # INDEX_PATH=web/genomes/Drosophila_melanogaster/current/indices/fff/ MIME_TYPE=text/tsv ## ---- search/report --------------------- ## default search field searchfield=all format=native # outfields=chr,start,feature,gene,range.stop,id resultspage = results.jsp ## for xslt to produce the result page tables # resultxsl = conf/fbab_result.xsl # resultspage = resultxsl.jsp header.native=# Chr Start Feature gene map range id db_xref notes footer.native= header.xml=\n footer.xml= xsl = gnomap.xsl # xsl = fban.xsl docurl=/cgi-bin/gbrowse_fb/dmel?id= outfields= gene,feature,chr,start,range.stop,url storefields= gene,chr,start,feature,range.stop,db_xref # displayFields = gene,chr,start,feature,range,db_xref # chr db_xref docclass docid feature gene id map modified notes # range range.start range.stop range.strand start uid url searchskip.range=1 searchskip.start=1 title.range.strand=strand title.range.stop=stop title.range.start=start ## --- field indexing ------------------- # locate data with regex file, folder patterns regex_folder=^\\w.+$ regex_file=^.*\\.fff$ regex_skipfile=.*\\.old regex_skipfolder=tmp|old.*|.*\\.old INDEX_CLASS=org.eugenes.index.LuceneTableIndexer analyzer=org.eugenes.index.BiodataAnalyzer fieldnames_lastcomment=false fieldnames_firstline=false fieldnames=chr start feature gene map range id db_xref notes regex_comment=^\\s*[!#] ## table field separator regex ## any whitespace # regex_keyval=\\s*(\\S+) ## tabs only regex_keyval=\\t*([^\\t]+) ## commas # regex_keyval=,*([^,]+) ## commas, optional quotes # regex_keyval=,*([^,]+)|,*"([^"]+)" ## append existing index or create new INDEX_APPEND=false ## index names as values (as well as field names)? INDEX_TAGS=false ## index values ? INDEX_ATTRIBUTES=false ## use fieldname xpath; full top.middle.last field name? INDEX_XPATH=false ## INDEX_LEVEL=0 means index main records one level below xml tag INDEX_LEVEL=2 INDEX_BLANKS=false merge_factor=10 max_field_length=1000000 ## memory crash cure: MAX_FIELDS=10000 # to create "contents" field of all text indexall=false ## field indexing parameters # special summary fields -- replace w/ fieldalias.TAG=newtag sumfields=docid,docclass field.docid=id field.docclass=feature ## fieldalias.OLDTAG=NEWTAG ## fieldalias precedes fieldtype.tag processing # fieldalias.GID=ID ## default - UnStored = index but dont store text fieldtype=Text # fieldtype.contents=UnStored # fieldtype.summary=UnIndexed fieldtype.ancestors=ignore ## these must always be stored; Text or UnIndexed fieldtype.docid=Text fieldtype.docclass=Text fieldtype.url=Text fieldtype.modified=Keyword analyzer=org.eugenes.index.BiodataAnalyzer ## field filters tokenfilter=org.eugenes.index.BiodataAnalyzer$DataFilter #tokenfilter.SYM=org.eugenes.index.BiodataAnalyzer$DataFilter #tokenfilter.ID=org.eugenes.index.BiodataAnalyzer$LowerDataFilter #tokenfilter.contents=org.eugenes.index.BiodataAnalyzer$LowerWordFilter # tokenfilter.len=org.eugenes.index.BiodataAnalyzer$NumberFilter tokenfilter.range.start=org.eugenes.index.BiodataAnalyzer$NumberFilter tokenfilter.range.stop=org.eugenes.index.BiodataAnalyzer$NumberFilter ## field tokenizers -- replace with filters tokenizer=org.eugenes.index.BiodataAnalyzer$LowerDataTokenizer #tokenizer.contents=org.eugenes.index.BiodataAnalyzer$LowerWordTokenizer tokenizer.db_xref=org.eugenes.index.BiodataAnalyzer$LowerWordTokenizer fieldrecoder.range=LucegeneIndexers$Location_FieldRecoder ## parse chr field from top source line #source fly 2L 1..22217931 - - - ##fieldrecoder.feature=LucegeneIndexers$FeatureSourceChr_FieldRecoder ##fieldrecoder.map=LucegeneIndexers$FeatureSourceChr_FieldRecoder