NCBI C++ ToolKit
|
Search Toolkit Book for Parser
#include <objtools/flatfile/flatfile_parse_info.hpp>
Classes | |
struct | SFindPubOptions |
Public Types | |
enum class | EOutput { BioseqSet , Seqsubmit } |
enum class | EMode { Release , HTGS , HTGSCON , Relaxed } |
enum class | ESource { unknown , NCBI , EMBL , GenBank , DDBJ , LANL , SPROT , Refseq , Flybase , USPTO , All } |
enum class | EFormat { unknown , EMBL , GenBank , SPROT , DDBJ , XML , ALL } |
Public Member Functions | |
Indexblk * | CurEntry () |
size_t | GetNumEntries () const |
Parser () | |
virtual | ~Parser () |
void | InitializeKeywordParser (EFormat) |
CKeywordParser & | KeywordParser () |
Private Attributes | |
CKeywordParser * | mpKeywordParser |
Definition at line 66 of file flatfile_parse_info.hpp.
enum class Parser::EFormat |
strong |
Enumerator | |
---|---|
unknown | |
EMBL | |
GenBank | |
SPROT | |
DDBJ | |
XML | |
ALL |
Definition at line 94 of file flatfile_parse_info.hpp.
enum class Parser::EMode |
strong |
Enumerator | |
---|---|
Release | |
HTGS | |
HTGSCON | |
Relaxed |
Definition at line 73 of file flatfile_parse_info.hpp.
enum class Parser::EOutput |
strong |
Enumerator | |
---|---|
BioseqSet | |
Seqsubmit |
Definition at line 68 of file flatfile_parse_info.hpp.
enum class Parser::ESource |
strong |
Enumerator | |
---|---|
unknown | |
NCBI | |
EMBL | |
GenBank | |
DDBJ | |
LANL | |
SPROT | |
Refseq | |
Flybase | |
USPTO | |
All |
Definition at line 80 of file flatfile_parse_info.hpp.
Parser::Parser | ( | ) |
Definition at line 44 of file flatfile_parse_info.cpp.
Parser::~Parser | ( | ) |
virtual |
Definition at line 62 of file flatfile_parse_info.cpp.
References mpKeywordParser, and ResetParserStruct().
Indexblk * Parser::CurEntry | ( | ) |
inline |
Definition at line 109 of file flatfile_parse_info.hpp.
size_t Parser::GetNumEntries | ( | ) | const |
inline |
Definition at line 110 of file flatfile_parse_info.hpp.
References indx.
void Parser::InitializeKeywordParser | ( | EFormat | fmt | ) |
Definition at line 49 of file flatfile_parse_info.cpp.
References mpKeywordParser.
Referenced by sParseFlatfile().
CKeywordParser & Parser::KeywordParser | ( | ) |
Definition at line 56 of file flatfile_parse_info.cpp.
References _ASSERT, and mpKeywordParser.
Referenced by EmblIndex(), GetDescrEmblBlock(), and GetEmblGBBlock().
Definition at line 180 of file flatfile_parse_info.hpp.
Referenced by FillAccsBySource(), fta_init_pp(), and GetAccession().
Definition at line 183 of file flatfile_parse_info.hpp.
Referenced by add_entry(), CheckDupEntries(), CheckGene(), CkCdRegion(), CkProteinTransl(), CreateEntryBioseq(), EmblAscii(), EmblIndex(), FillAccsBySource(), flat2asn_range_func(), Flat2AsnCheck(), fta_add_hist(), fta_init_pp(), fta_parse_buf(), GenBankAscii(), GenBankAsciiOrig(), GenBankIndex(), get_sequence_text(), GetAccession(), GetEmblInstContig(), GetGenBankInstContig(), GetOneGeneRef(), GetProtRefSeqId(), GetSeqExt(), GetSeqLocation(), GetSprotDescr(), GetSPSeqLoc(), LoadFeat(), QSIndex(), sParseFlatfile(), SPFeatProtRef(), SPGetOneGeneRefNew(), SprotAscii(), XMLAscii(), XMLCheckRequiredTags(), XMLGetInstContig(), and XMLIndex().
Definition at line 135 of file flatfile_parse_info.hpp.
Referenced by FillAccsBySource(), fta_init_pp(), and GetAccession().
Definition at line 130 of file flatfile_parse_info.hpp.
Referenced by FillAccsBySource(), fta_init_pp(), fta_set_format_source(), IsPatentedAccPrefix(), IsTLSAccPrefix(), IsTPAAccPrefix(), IsTSAAccPrefix(), and IsWGSAccPrefix().
Definition at line 210 of file flatfile_parse_info.hpp.
Referenced by Flat2AsnCheck(), fta_fix_seq_loc_id(), fta_init_pp(), GetEmblInstContig(), GetGenBankInstContig(), and XMLGetInstContig().
Definition at line 194 of file flatfile_parse_info.hpp.
Referenced by fta_add_hist(), GetDescrEmblBlock(), GetDescrSPBlock(), GetEmblGBBlock(), GetGBBlock(), XMLGetEMBLBlock(), and XMLGetGBBlock().
string Parser::authors_str |
Definition at line 118 of file flatfile_parse_info.hpp.
Referenced by GetAuthorsStr(), and MakeSeqSubmit().
optional<string> Parser::buf |
Definition at line 217 of file flatfile_parse_info.hpp.
Referenced by CkCdRegion(), flat2asn_range_func(), GetEmblInstContig(), GetGenBankInstContig(), ParseSourceFeat(), ProcFeatBlk(), SeqFeatPub(), SpProcFeatBlk(), and XMLGetInstContig().
Definition at line 172 of file flatfile_parse_info.hpp.
Referenced by FillAccsBySource(), fta_init_pp(), GenBankAsciiOrig(), OutputEmblAsn(), SpPrepareEntry(), and XMLAscii().
Int4 Parser::cleanup = 0 |
Definition at line 205 of file flatfile_parse_info.hpp.
Referenced by Flat2AsnCheck(), fta_init_pp(), GenBankAsciiOrig(), OutputEmblAsn(), and XMLAscii().
Definition at line 179 of file flatfile_parse_info.hpp.
Referenced by Flat2AsnCheck(), fta_init_pp(), GenBankAsciiOrig(), OutputEmblAsn(), and XMLAscii().
Int4 Parser::curindx = 0 |
Definition at line 108 of file flatfile_parse_info.hpp.
Referenced by BuildBioSegHeader(), check_short_CDS(), CheckDivCode(), CheckGene(), CkNonTerSP(), CkSegmentSet(), CollectGapFeats(), CreateEntryBioseq(), CreateRawBioSources(), CurEntry(), DealWithGenes(), DescrRefs(), EmblAscii(), EmblIndex(), CFindPub::fix_pub_equiv(), flat2asn_range_func(), fta_fix_seq_loc_id(), fta_get_genetic_code(), fta_init_pp(), fta_is_con_div(), fta_replace_org(), GenBankAscii(), GenBankAsciiOrig(), GenBankIndex(), get_bioseq(), get_pat(), get_sub(), GetBioseq(), GetDescrEmblBlock(), GetDescrSPBlock(), GetEmblDescr(), GetEmblGBBlock(), GetEmblInst(), GetEmblMolInfo(), GetFlatBiomol(), GetGBBlock(), GetGenBankDescr(), GetGenBankInst(), GetGenBankMolInfo(), GetOneGeneRef(), GetProtRefSeqId(), GetSeqData(), GetSeqExt(), GetSPAnnot(), GetSprotDescr(), GetSPSeqLoc(), InternalStopCodon(), Entry::IsAA(), LoadFeat(), OutputEmblAsn(), parse_entry(), ParseSourceFeat(), ProcFeatBlk(), ProcNucProt(), ResetParserStruct(), SPFeatProtRef(), SPGetGeneRefsNew(), SPGetOneGeneRefNew(), SpPrepareEntry(), SprotAscii(), SprotIndex(), SrchCdRegion(), Entry::xInitSeqInst(), XMLAscii(), XMLGetDescr(), XMLGetEMBLBlock(), XMLGetGBBlock(), XMLGetInst(), XMLGetMolInfo(), XMLIndex(), and XMLLoadEntry().
Definition at line 168 of file flatfile_parse_info.hpp.
Referenced by fta_init_pp(), GetGenBankDescr(), and XMLGetDescr().
Definition at line 175 of file flatfile_parse_info.hpp.
Referenced by CkProteinTransl(), CkSegmentSet(), EmblAscii(), fta_init_pp(), GenBankAsciiOrig(), InternalStopCodon(), LoadFeat(), ProcFeatBlk(), SeqFeatPub(), SpProcFeatBlk(), and XMLAscii().
Definition at line 191 of file flatfile_parse_info.hpp.
Referenced by CheckGene().
Uint1 Parser::entrez_fetch = 0 |
Definition at line 140 of file flatfile_parse_info.hpp.
Referenced by fta_add_hist(), fta_init_pp(), fta_is_con_div(), and fta_parse_buf().
TEntryList Parser::entries |
Definition at line 120 of file flatfile_parse_info.hpp.
Referenced by CloseAll(), fta_parse_buf(), GenBankAsciiOrig(), MakeBioseqSet(), MakeSeqSubmit(), OutputEmblAsn(), SprotAscii(), and XMLAscii().
vector<IndexblkPtr> Parser::entrylist |
Definition at line 107 of file flatfile_parse_info.hpp.
Referenced by add_entry(), BuildBioSegHeader(), check_short_CDS(), CheckDivCode(), CheckDupEntries(), CheckGene(), CkNonTerSP(), CkSegmentSet(), CollectGapFeats(), CreateEntryBioseq(), CreateRawBioSources(), CurEntry(), DealWithGenes(), DescrRefs(), EmblAscii(), EmblIndex(), EmblSegment(), CFindPub::fix_pub_equiv(), flat2asn_range_func(), fta_fix_seq_loc_id(), fta_get_genetic_code(), fta_init_pp(), fta_is_con_div(), fta_parse_buf(), fta_replace_org(), GenBankAscii(), GenBankAsciiOrig(), GenBankIndex(), get_bioseq(), get_pat(), get_sub(), GetBioseq(), GetDescrEmblBlock(), GetDescrSPBlock(), GetEmblDescr(), GetEmblGBBlock(), GetEmblInst(), GetEmblMolInfo(), GetFlatBiomol(), GetGBBlock(), GetGenBankDescr(), GetGenBankInst(), GetGenBankMolInfo(), GetOneGeneRef(), GetProtRefSeqId(), GetSeqData(), GetSeqExt(), GetSPAnnot(), GetSprotDescr(), GetSPSeqLoc(), InternalStopCodon(), Entry::IsAA(), LoadFeat(), OutputEmblAsn(), parse_entry(), ParseSourceFeat(), ProcFeatBlk(), ProcNucProt(), ResetParserStruct(), sParseFlatfile(), SPFeatProtRef(), SPGetGeneRefsNew(), SPGetOneGeneRefNew(), SpPrepareEntry(), SprotAscii(), SprotIndex(), SrchCdRegion(), Entry::xInitSeqInst(), XMLAscii(), XMLGetDescr(), XMLGetEMBLBlock(), XMLGetGBBlock(), XMLGetInst(), XMLGetMolInfo(), XMLIndex(), XMLLoadEntry(), and XMLPerformIndex().
Int4 Parser::errstat = 0 |
Definition at line 193 of file flatfile_parse_info.hpp.
Referenced by ParseSourceFeat().
Definition at line 222 of file flatfile_parse_info.hpp.
Referenced by flat2asn_range_func(), and get_bioseq().
Definition at line 224 of file flatfile_parse_info.hpp.
Referenced by fta_init_pp(), and get_sequence_text().
Definition at line 228 of file flatfile_parse_info.hpp.
Referenced by fta_init_pp(), and get_sequence_text().
Definition at line 225 of file flatfile_parse_info.hpp.
Referenced by fta_init_pp(), and get_sequence_text().
Definition at line 229 of file flatfile_parse_info.hpp.
Referenced by fta_init_pp(), and get_sequence_text().
Definition at line 226 of file flatfile_parse_info.hpp.
Referenced by EmblAscii(), fta_init_pp(), GenBankAsciiOrig(), and XMLAscii().
Definition at line 227 of file flatfile_parse_info.hpp.
Referenced by EmblAscii(), fta_init_pp(), GenBankAsciiOrig(), and XMLAscii().
FileBuf Parser::ffbuf |
Definition at line 115 of file flatfile_parse_info.hpp.
Referenced by EmblIndex(), Flat2AsnCheck(), fta_parse_buf(), GenBankIndex(), LoadEntry(), LoadEntryGenbank(), CFlatFileParser::Parse(), and SprotIndex().
Definition at line 221 of file flatfile_parse_info.hpp.
Referenced by flat2asn_range_func(), and fta_init_pp().
EFormat Parser::format = EFormat::unknown |
Definition at line 128 of file flatfile_parse_info.hpp.
Referenced by add_entry(), CollectGapFeats(), DescrRefs(), EmblAscii(), FillAccsBySource(), Flat2AsnCheck(), FlatFileIndex(), fta_parse_buf(), fta_set_format_source(), GenBankAsciiOrig(), get_art(), get_bioseq(), get_pat(), GetAccession(), GetDescrEmblBlock(), GetFlatBiomol(), GetGBBlock(), GetSeqData(), ImpFeatPub(), InitialEntry(), journal(), LoadEntry(), LoadEntryGenbank(), LoadFeat(), parse_entry(), SeqFeatPub(), SetReleaseStr(), sParseFlatfile(), SpPrepareEntry(), and XMLAscii().
SFindPubOptions Parser::fpo |
Definition at line 167 of file flatfile_parse_info.hpp.
Referenced by CFindPub::CFindPub(), and fta_fill_find_pub_option().
Definition at line 211 of file flatfile_parse_info.hpp.
Referenced by DealWithGenes(), Flat2AsnCheck(), and fta_init_pp().
Definition at line 184 of file flatfile_parse_info.hpp.
Referenced by fta_add_hist(), fta_init_pp(), and GetSprotDescr().
Definition at line 188 of file flatfile_parse_info.hpp.
Referenced by EmblAscii(), fta_init_pp(), GenBankAsciiOrig(), and XMLAscii().
Definition at line 186 of file flatfile_parse_info.hpp.
Referenced by GetProtRefSeqId().
Definition at line 185 of file flatfile_parse_info.hpp.
Referenced by fta_init_pp(), and GenBankIndex().
Int4 Parser::indx = 0 |
Definition at line 105 of file flatfile_parse_info.hpp.
Referenced by add_entry(), CheckDupEntries(), CkSegmentSet(), EmblAscii(), EmblIndex(), EmblSegment(), flat2asn_range_func(), fta_init_pp(), fta_parse_buf(), GenBankAscii(), GenBankAsciiOrig(), GenBankIndex(), GetNumEntries(), QSIndex(), ResetParserStruct(), sParseFlatfile(), SprotAscii(), SprotIndex(), XMLAscii(), XMLIndex(), and XMLPerformIndex().
Int4 Parser::limit = 0 |
Definition at line 124 of file flatfile_parse_info.hpp.
Referenced by EmblAscii(), Flat2AsnCheck(), fta_init_pp(), GenBankAsciiOrig(), OutputEmblAsn(), and XMLAscii().
Uint1 Parser::medserver = 0 |
Definition at line 148 of file flatfile_parse_info.hpp.
Referenced by embl_refs(), Flat2AsnCheck(), fta_find_pub_explore(), fta_fini_servers(), fta_init_pp(), fta_init_servers(), fta_parse_buf(), gb_refs_common(), and XMLRefs().
EMode Parser::mode = EMode::Release |
Definition at line 189 of file flatfile_parse_info.hpp.
Referenced by CkCdRegion(), CreateEntryBioseq(), DescrRefs(), FillAccsBySource(), Flat2AsnCheck(), fta_init_pp(), GenBankAsciiOrig(), GenBankIndex(), GetAccession(), GetGBBlock(), GetProtRefSeqId(), InitialEntry(), and LoadFeat().
CKeywordParser * Parser::mpKeywordParser |
private |
Definition at line 241 of file flatfile_parse_info.hpp.
Referenced by InitializeKeywordParser(), KeywordParser(), and ~Parser().
Definition at line 177 of file flatfile_parse_info.hpp.
Referenced by CkCdRegion(), fta_get_genetic_code(), fta_init_pp(), InternalStopCodon(), and ProcNucProt().
Definition at line 170 of file flatfile_parse_info.hpp.
Referenced by fta_init_pp(), GenBankAsciiOrig(), GetEmblDescr(), GetGenBankDescr(), XMLAscii(), and XMLGetDescr().
Definition at line 150 of file flatfile_parse_info.hpp.
Referenced by fta_find_pub_explore(), and fta_init_servers().
Int4 Parser::num_drop = 0 |
Definition at line 133 of file flatfile_parse_info.hpp.
Referenced by CkSegmentSet(), EmblIndex(), fta_init_pp(), fta_parse_buf(), GenBankIndex(), sParseFlatfile(), SprotIndex(), and XMLIndex().
EOutput Parser::output_format = EOutput::BioseqSet |
Definition at line 218 of file flatfile_parse_info.hpp.
Referenced by CloseAll(), and sParseFlatfile().
ProtBlkPtr Parser::pbp = nullptr |
Definition at line 146 of file flatfile_parse_info.hpp.
Referenced by CkCdRegion(), FindCd(), fta_get_genetic_code(), fta_init_pp(), fta_parse_buf(), GetGcode(), GuessGeneticCode(), ProcNucProt(), ResetParserStruct(), sParseFlatfile(), and SrchCdRegion().
Definition at line 216 of file flatfile_parse_info.hpp.
Referenced by CFindPub::fix_pub_annot(), Flat2AsnCheck(), fta_init_pp(), GenBankAsciiOrig(), LoadFeat(), MakeBioseqSet(), OutputEmblAsn(), and XMLAscii().
FILE* Parser::qsfd = nullptr |
Definition at line 215 of file flatfile_parse_info.hpp.
Referenced by CloseFiles(), EmblAscii(), EmblIndex(), Flat2AsnCheck(), fta_init_pp(), GenBankAsciiOrig(), GenBankIndex(), QSIndex(), and XMLAscii().
Definition at line 212 of file flatfile_parse_info.hpp.
Referenced by Flat2AsnCheck(), fta_init_pp(), and QSIndex().
string Parser::release_str |
Definition at line 117 of file flatfile_parse_info.hpp.
Referenced by MakeBioseqSet(), and SetReleaseStr().
Definition at line 178 of file flatfile_parse_info.hpp.
Referenced by fta_init_pp(), and GetBioseq().
Definition at line 176 of file flatfile_parse_info.hpp.
Referenced by EmblAscii(), EmblIndex(), and fta_init_pp().
Uint1 Parser::seqtype = 0 |
Definition at line 131 of file flatfile_parse_info.hpp.
Referenced by CreateEntryBioseq(), FillAccsBySource(), fta_init_pp(), GetBioseq(), GetSeqExt(), GetSPSeqLoc(), journal(), and LoadFeat().
Definition at line 202 of file flatfile_parse_info.hpp.
Referenced by CheckGene(), and fta_init_pp().
Definition at line 174 of file flatfile_parse_info.hpp.
Referenced by Flat2AsnCheck(), fta_init_pp(), fta_parse_buf(), and sParseFlatfile().
ESource Parser::source = ESource::unknown |
Definition at line 129 of file flatfile_parse_info.hpp.
Referenced by BldProtRefSeqEntry(), CkCdRegion(), CollectGapFeats(), CreateEntryBioseq(), DealWithGenes(), DescrRefs(), EmblAscii(), EmblIndex(), FillAccsBySource(), FindCd(), CFindPub::fix_pub_annot(), flat2asn_range_func(), fta_add_hist(), fta_fix_seq_loc_id(), fta_replace_org(), GenBankAscii(), GenBankAsciiOrig(), GenBankIndex(), get_art(), get_pat(), get_sub(), get_sub_gsdb(), GetAccession(), GetAuthorsStr(), GetDescrEmblBlock(), GetDescrSPBlock(), GetEmblDescr(), GetEmblGBBlock(), GetEmblInst(), GetFlatBiomol(), GetGBBlock(), GetGenBankDescr(), GetProtRefSeqId(), GetSeqData(), GetSPDate(), GetSprotDescr(), InitialEntry(), IsPatentedAccPrefix(), IsTLSAccPrefix(), IsTPAAccPrefix(), IsTSAAccPrefix(), IsWGSAccPrefix(), journal(), LoadEntry(), LoadEntryGenbank(), LoadFeat(), ParseSourceFeat(), SetReleaseStr(), sp_refs(), SprotIndex(), XMLAscii(), XMLCheckRequiredTags(), XMLGetDescr(), XMLGetEMBLBlock(), XMLGetGBBlock(), XMLIndex(), and XMLRefs().
Definition at line 198 of file flatfile_parse_info.hpp.
Referenced by Flat2AsnCheck(), fta_init_pp(), GetDescrSPBlock(), and SprotIndex().
Uint1 Parser::taxserver = 0 |
Definition at line 145 of file flatfile_parse_info.hpp.
Referenced by CkCdRegion(), Flat2AsnCheck(), fta_fix_orgref(), fta_fix_orgref_byid(), fta_get_genetic_code(), fta_init_pp(), fta_init_servers(), fta_parse_buf(), GetEmblDescr(), GetGenBankDescr(), InternalStopCodon(), ParseSourceFeat(), ProcNucProt(), and XMLGetDescr().
Definition at line 173 of file flatfile_parse_info.hpp.
Referenced by CkProteinTransl(), and fta_init_pp().
void* Parser::user_data = nullptr |
Definition at line 223 of file flatfile_parse_info.hpp.
Referenced by fta_init_pp().
Definition at line 197 of file flatfile_parse_info.hpp.
Referenced by GenBankAsciiOrig(), GetEmblDescr(), GetGenBankDescr(), OutputEmblAsn(), SetReleaseStr(), XMLAscii(), XMLGetDescr(), and XMLRefs().