CPP_DOC/doxyhtml/cleanup__utils_8cpp_source.html

 /* $Id: cleanup_utils.cpp 102112 2024-04-02 18:07:29Z stakhovv $

  * ===========================================================================

  *

  *                            PUBLIC DOMAIN NOTICE

  *               National Center for Biotechnology Information

  *

  *  This software/database is a "United States Government Work" under the

  *  terms of the United States Copyright Act.  It was written as part of

  *  the author's official duties as a United States Government employee and

  *  thus cannot be copyrighted.  This software/database is freely available

  *  to the public for use. The National Library of Medicine and the U.S.

  *  Government have not placed any restriction on its use or reproduction.

  *

  *  Although all reasonable efforts have been taken to ensure the accuracy

  *  and reliability of the software and data, the NLM and the U.S.

  *  Government do not and cannot warrant the performance or results that

  *  may be obtained by using this software or data. The NLM and the U.S.

  *  Government disclaim all warranties, express or implied, including

  *  warranties of performance, merchantability or fitness for any particular

  *  purpose.

  *

  *  Please cite the author in any work or product based on this material.

  *

  * ===========================================================================

  *

  * Author:  Mati Shomrat

  *

  * File Description:

  *   General utilities for data cleanup.

  *

  * ===========================================================================

  */

 #include <ncbi_pch.hpp>

 #include <corelib/ncbistd.hpp>

 #include "cleanup_utils.hpp"


 #include <objmgr/util/seq_loc_util.hpp>

 #include <objmgr/util/sequence.hpp>

 #include <objects/seq/Pubdesc.hpp>

 #include <objects/pub/Pub_equiv.hpp>

 #include <objects/pub/Pub.hpp>

 #include <objects/biblio/Cit_sub.hpp>

 #include <objects/biblio/Cit_gen.hpp>

 #include <objects/biblio/Auth_list.hpp>

 #include <objects/biblio/Affil.hpp>

 #include <objects/biblio/Author.hpp>

 #include <objects/biblio/Imprint.hpp>

 #include <objects/general/Date.hpp>

 #include <objects/general/Person_id.hpp>

 #include <objects/general/Name_std.hpp>


 #include <objects/seq/Seqdesc.hpp>

 #include <objects/seq/MolInfo.hpp>

 #include <objects/seq/seq_loc_from_string.hpp>

 #include <objects/seqfeat/Org_ref.hpp>

 #include <objects/misc/sequence_macros.hpp>


 #include <objmgr/seqdesc_ci.hpp>


 #include <objtools/cleanup/cleanup_pub.hpp>


 BEGIN_NCBI_SCOPE

 BEGIN_SCOPE(objects)


 // Character range tests against 'a'..'z' and 'A'..'Z'.
 // NOTE: each macro evaluates its argument twice, so do not pass an
 // expression with side effects (e.g. IS_LOWER(*p++)).
 #define IS_LOWER(c)     ('a'<=(c) && (c)<='z')

 #define IS_UPPER(c)     ('A'<=(c) && (c)<='Z')


 using namespace sequence;


 // Strip leading and trailing spaces, semicolons and commas from str.
 //
 // A trailing semicolon is kept when it may terminate an HTML entity such
 // as "&nbsp;": that is, when scanning backwards from the last good
 // character an '&' is met before any space or comma.
 //
 // Returns true if str was modified.
 bool CleanVisString( string &str )
 {
     const char* const junk_chars = " ;,";

     if( str.empty() ) {
         return false;
     }

     // --- leading junk ---
     const string::size_type head = str.find_first_not_of(junk_chars);
     if( head == string::npos ) {
         // nothing but junk
         str.clear();
         return true;
     }
     bool modified = false;
     if( head != 0 ) {
         str.erase( 0, head );
         modified = true;
     }

     // --- trailing junk ---
     const string::size_type tail = str.find_last_not_of(junk_chars);
     _ASSERT( tail != string::npos ); // the all-junk case returned above
     if( tail + 1 == str.length() ) {
         // nothing to chop off the end
         return modified;
     }

     // By default keep everything up to and including the last good char.
     string::size_type keep_len = tail + 1;
     if( str[tail + 1] == ';' ) {
         // The semicolon survives only if an '&' precedes it with no space
         // or comma in between (a space or comma makes the '&' irrelevant).
         const string::size_type breaker = str.find_last_of( "& ,", tail );
         if( breaker != string::npos && str[breaker] == '&' ) {
             keep_len = tail + 2;
         }
     }

     if( keep_len == str.length() ) {
         // the protected semicolon is already the last character
         return modified;
     }
     str.resize( keep_len );
     return true;
 }


 // Trim "junk" from the end of str and whitespace/control characters from
 // its start.
 //
 // Trailing junk is any run of characters that are <= ' ' or one of
 // '.', ',', '~', ';'.  The run is removed, except that:
 //   - if it contains a period, a single "." is kept (or "..." when
 //     allow_ellipses is true, the run has at least three characters and
 //     its 2nd and 3rd characters are periods);
 //   - otherwise, if it starts with "~~", that double tilde is kept.
 //
 // This is based on the C function TrimSpacesAndJunkFromEnds and is meant
 // to produce the same output.
 // TODO: the logic is duplicated from TrimSpacesAndJunkFromEnds; the two
 // should eventually share one implementation.
 //
 // Returns true if str was modified.
 bool CleanVisStringJunk( string &str, bool allow_ellipses )
 {
     if ( str.empty() ) {
         return false;
     }

     // Find where the trailing junk starts, remembering whether it holds a
     // period and/or a tilde.
     // Bytes are classified as unsigned char: with a signed plain char every
     // byte >= 0x80 (e.g. UTF-8 multi-byte sequences) is negative, compares
     // "<= ' '" and would be stripped as junk on some platforms only.
     bool isPeriod = false;
     bool isTilde = false;
     string::size_type start_of_junk_pos = str.length();
     while ( start_of_junk_pos > 0 ) {
         const unsigned char ch =
             static_cast<unsigned char>( str[start_of_junk_pos - 1] );
         const bool is_junk =
             (ch <= ' ' || ch == '.' || ch == ',' || ch == '~' || ch == ';');
         if ( !is_junk ) {
             break;
         }
         isPeriod = (isPeriod || ch == '.');
         isTilde = (isTilde || ch == '~');
         --start_of_junk_pos;
     }

     bool changed = false;

     // if there's junk, chop it off (but leave period/tildes/ellipsis as appropriate)
     if ( start_of_junk_pos < str.length() ) {

         // what to put back after the junk is removed; empty means "nothing"
         const char * suffix = "";

         const string::size_type chars_in_junk = str.length() - start_of_junk_pos;

         if (isPeriod) {
             // allow one period at end, or an ellipsis if requested
             suffix = ".";
             if ( allow_ellipses && (chars_in_junk >= 3) &&
                 str[start_of_junk_pos+1] == '.' && str[start_of_junk_pos+2] == '.' ) {
                 suffix = "...";
             }
         } else if ( isTilde && str[start_of_junk_pos] == '~' ) {
             // allow a double tilde at the end; a single one is dropped
             const bool doubleTilde =
                 ( (chars_in_junk >= 2) && str[start_of_junk_pos+1] == '~' );
             suffix = ( doubleTilde ? "~~" : "" );
         }

         if( suffix[0] != '\0' ) {
             // only touch the string if the junk is not already exactly the suffix
             if( 0 != str.compare( start_of_junk_pos, string::npos, suffix ) ) {
                 str.erase( start_of_junk_pos );
                 str += suffix;
                 changed = true;
             }
         } else {
             str.erase( start_of_junk_pos );
             changed = true;
         }
     }

     // drop leading whitespace / control characters (again as unsigned bytes)
     string::size_type first_kept = 0;
     while ( first_kept < str.length() &&
             static_cast<unsigned char>( str[first_kept] ) <= ' ' ) {
         ++first_kept;
     }
     if( first_kept > 0 ) {
         str.erase( 0, first_kept );
         changed = true;
     }

     return changed;
 }


 // Remove whitespace (space, tab, newline, carriage return) that sits
 // between two tildes, so that "~  ~" becomes "~~".
 // Returns true if str was modified.
 bool  RemoveSpacesBetweenTildes(string& str)
 {
     static const char* const blanks = " \t\n\r";

     bool modified = false;
     string::size_type left = str.find('~');

     // 'left' always indexes a tilde; look at the first non-blank after it.
     while (left != string::npos) {
         const string::size_type right = str.find_first_not_of(blanks, left + 1);
         if (right == string::npos) {
             break;  // only blanks (or nothing) follow the tilde
         }

         if (str[right] != '~') {
             // some other text follows; restart from the next tilde, if any
             left = str.find('~', right + 1);
             continue;
         }

         // two tildes separated by 'gap' blanks (possibly zero)
         const string::size_type gap = right - left - 1;
         if (gap != 0) {
             str.erase(left + 1, gap);
             modified = true;
         }
         // either way the second tilde now sits right after the first
         ++left;
     }
     return modified;
 }


 // Replace every double quote in str with a single quote.
 // Returns true if at least one character was replaced.
 bool CleanDoubleQuote(string& str)
 {
     bool replaced_any = false;
     for (char& ch : str) {
         if (ch != '\"') {
             continue;
         }
         ch = '\'';
         replaced_any = true;
     }
     return replaced_any;
 }


 // Collapse runs of semicolons, spaces and tabs that follow a semicolon.
 //
 // For each ';' the run of ';', ' ' and '\t' immediately after it is
 // examined:
 //   - an empty run, or a run that is exactly one space, is left alone;
 //   - a run that reaches the end of the string is removed together with
 //     the semicolon that starts it;
 //   - any other run is replaced by a single space if it contained a
 //     space, or removed entirely if it did not.
 //
 // The string is edited in place (erase/replace) rather than rebuilt from
 // substrings on every run.
 void TrimInternalSemicolons (string& str)
 {
     string::size_type pos = str.find(';');
     while (pos != string::npos) {
         // measure the run [pos + 1, run_end) that follows this semicolon
         string::size_type run_end = pos + 1;
         bool has_space = false;
         while (run_end < str.length()) {
             const char c = str[run_end];
             if (c != ';' && c != ' ' && c != '\t') {
                 break;
             }
             has_space = has_space || (c == ' ');
             ++run_end;
         }

         if (run_end == pos + 1 || (has_space && run_end == pos + 2)) {
             // nothing to fix, advance semicolon search
             pos = str.find(';', run_end);
         } else if (run_end == str.length()) {
             // nothing but semicolons, spaces, and tabs from here to the
             // end of the string: truncate, dropping this semicolon too
             str.erase(pos);
             break;
         } else {
             const string::size_type run_len = run_end - pos - 1;
             if (has_space) {
                 str.replace(pos + 1, run_len, 1, ' ');
             } else {
                 str.erase(pos + 1, run_len);
             }
             pos = str.find(';', pos + 1);
         }
     }
 }


 // Two-character patterns packed as (first_char << 8) | second_char, for
 // comparison against the rolling two-character window kept by
 // Asn2gnbkCompressSpaces.
 #define twocommas ((',') << 8 | (','))
 #define twospaces ((' ') << 8 | (' '))
 #define twosemicolons ((';') << 8 | (';'))
 #define space_comma ((' ') << 8 | (','))
 #define space_bracket ((' ') << 8 | (')'))
 #define bracket_space (('(') << 8 | (' '))
 #define space_semicolon ((' ') << 8 | (';'))
 #define comma_space ((',') << 8 | (' '))
 #define semicolon_space ((';') << 8 | (' '))

 // Space/punctuation compression ported from the C Toolkit.
 //
 // The text is scanned with a two-character window (curr, next):
 //   ",,"          -> ", "  (second comma becomes a space)
 //   "  " / ";;"   -> the first character of the pair is dropped
 //   "( "          -> the space is dropped
 //   " )"          -> the space is dropped
 //   " ," / " ;"   -> ", " / "; ", then any further spaces and
 //                    commas / semicolons are skipped
 //   ", " / "; "   -> kept, then any further spaces and
 //                    commas / semicolons are skipped
 // Afterwards leading and trailing ' ' characters are removed (tabs and
 // newlines at the ends are deliberately kept).
 //
 // Only the text before the first embedded NUL character of val is
 // processed.  Returns true if val was modified.
 //
 // The result is appended to a std::string instead of being written into a
 // manually new[]-allocated scratch buffer, so nothing can leak if an
 // allocation throws.
 bool Asn2gnbkCompressSpaces(string& val)
 {
     if (val.empty()) {
         return false;
     }

     string compressed;
     compressed.reserve(val.length());

     // Read-only cursor over the NUL-terminated input.  It is never
     // dereferenced past the terminator: once a NUL has been read into
     // 'next' no pattern can match and the loop ends on the next test.
     const char* in = val.c_str();

     char curr = *in++;
     // Bytes enter the window as unsigned char; only ASCII pairs are ever
     // matched, so this cannot change which branch is taken.
     unsigned short two_chars = static_cast<unsigned char>(curr);

     while (curr != '\0') {
         char next = *in++;
         two_chars = static_cast<unsigned short>(
             (two_chars << 8) | static_cast<unsigned char>(next));

         if (two_chars == twocommas) {
             compressed += curr;
             next = ' ';               // pretend the second comma was a space
             two_chars = static_cast<unsigned char>(next);
         }
         else if (two_chars == twospaces ||
                  two_chars == twosemicolons ||
                  two_chars == space_bracket) {
             // drop curr; next becomes the new curr below
         }
         else if (two_chars == bracket_space) {
             // drop the space: stay on '(' and re-pair it with what follows
             next = curr;
             two_chars = static_cast<unsigned char>(curr);
         }
         else if (two_chars == space_comma) {
             compressed += next;       // ','
             compressed += ' ';
             next = curr;              // ' ' -- guarantees one skip step
             while (next == ' ' || next == ',') {
                 next = *in++;
             }
             two_chars = static_cast<unsigned char>(next);
         }
         else if (two_chars == space_semicolon) {
             compressed += next;       // ';'
             compressed += ' ';
             next = curr;              // ' ' -- guarantees one skip step
             while (next == ' ' || next == ';') {
                 next = *in++;
             }
             two_chars = static_cast<unsigned char>(next);
         }
         else if (two_chars == comma_space) {
             compressed += curr;       // ','
             compressed += ' ';
             while (next == ' ' || next == ',') {
                 next = *in++;
             }
             two_chars = static_cast<unsigned char>(next);
         }
         else if (two_chars == semicolon_space) {
             compressed += curr;       // ';'
             compressed += ' ';
             while (next == ' ' || next == ';') {
                 next = *in++;
             }
             two_chars = static_cast<unsigned char>(next);
         }
         else {
             compressed += curr;
         }

         curr = next;
     }

     /* TrimSpacesAroundString but allow leading/trailing tabs/newlines */
     const string::size_type first_kept = compressed.find_first_not_of(' ');
     if (first_kept == string::npos) {
         compressed.clear();           // empty or nothing but spaces
     } else {
         compressed.erase(compressed.find_last_not_of(' ') + 1);
         compressed.erase(0, first_kept);
     }

     if (compressed == val) {
         return false;
     }
     val.swap(compressed);
     return true;
 }


 // Trim leading and trailing whitespace/control characters (<= ' '),
 // semicolons and commas from val.
 //
 // At the tail, a semicolon does not start the junk run while an '&' has
 // been seen that was not followed by whitespace or a comma, so that an
 // HTML entity such as "&nbsp;" keeps its terminator.
 //
 // Bytes are examined as unsigned char so that 8-bit characters of
 // multibyte text are never mistaken for control characters.
 // Only the text before the first embedded NUL character of val is
 // processed.  Returns true if val was modified.
 //
 // The work is done on a std::string copy rather than a manually
 // new[]-allocated buffer, so nothing can leak if an allocation throws.
 bool TrimSpacesSemicolonsAndCommas(string& val)
 {
     if (val.empty()) {
         return false;
     }

     // constructing from c_str() stops at the first NUL
     string trimmed(val.c_str());

     // --- leading junk ---
     string::size_type first_kept = 0;
     while (first_kept < trimmed.length()) {
         const unsigned char ch = static_cast<unsigned char>(trimmed[first_kept]);
         if ( !(ch <= ' ' || ch == ';' || ch == ',') ) {
             break;
         }
         ++first_kept;
     }
     trimmed.erase(0, first_kept);

     // --- trailing junk ---
     // junk_start: start of the junk run currently being tracked, or npos.
     // after_amp:  an '&' was seen and no whitespace/comma has followed it.
     string::size_type junk_start = string::npos;
     bool after_amp = false;
     for (string::size_type i = 0; i < trimmed.length(); ++i) {
         const unsigned char ch = static_cast<unsigned char>(trimmed[i]);
         if (ch == '&') {
             after_amp = true;
             junk_start = string::npos;
         }
         else if (ch <= ' ' || ch == ',') {
             if (junk_start == string::npos) {
                 junk_start = i;
             }
             after_amp = false;
         }
         else if (ch == ';') {
             // may terminate an entity: only junk when no '&' is pending
             if (junk_start == string::npos && !after_amp) {
                 junk_start = i;
             }
         }
         else {
             junk_start = string::npos;
         }
     }
     if (junk_start != string::npos) {
         trimmed.erase(junk_start);
     }

     if (trimmed == val) {
         return false;
     }
     val.swap(trimmed);
     return true;
 }


 // Remove every character for which isspace() is true from str,
 // compacting the remaining characters in place.
 // Returns true if anything was removed.
 bool RemoveSpaces(string& str)
 {
     // 'kept' is the write position; it never runs ahead of the read position
     string::size_type kept = 0;
     for (const char c : str) {
         if (isspace((unsigned char)c)) {
             continue;
         }
         str[kept++] = c;
     }

     if (kept == str.length()) {
         return false;   // also covers the empty string
     }
     str.resize(kept);
     return true;
 }


 // CGetSeqLocFromStringHelper implementation used by ReadLocFromText:
 // it forwards Seq_loc_Add to sequence::Seq_loc_Add, supplying the scope
 // pointer given at construction.  The scope is stored as a raw pointer
 // and is not owned by this object.
 class CGetSeqLocFromStringHelper_ReadLocFromText : public CGetSeqLocFromStringHelper {
 public:
     CGetSeqLocFromStringHelper_ReadLocFromText( CScope *scope )
         : m_scope(scope)
     {
     }

     // Add two seq-locs in the context of the stored scope.
     virtual CRef<CSeq_loc> Seq_loc_Add(
         const CSeq_loc&    loc1,
         const CSeq_loc&    loc2,
         CSeq_loc::TOpFlags flags )
     {
         CRef<CSeq_loc> combined = sequence::Seq_loc_Add( loc1, loc2, flags, m_scope );
         return combined;
     }

 private:
     CScope *m_scope;
 };


 // Parse a textual location into a CSeq_loc by calling
 // GetSeqLocFromString with a helper bound to the given scope.
 CRef<CSeq_loc> ReadLocFromText(const string& text, const CSeq_id *id, CScope *scope)
 {
     CGetSeqLocFromStringHelper_ReadLocFromText scoped_helper(scope);
     CRef<CSeq_loc> parsed_loc = GetSeqLocFromString(text, id, &scoped_helper);
     return parsed_loc;
 }


 // One row of the amino-acid lookup table: an abbreviation string paired
 // with the single-letter code that x_ValidAminoAcid returns for it.
 typedef struct proteinabbrev {

      // abbreviation text, e.g. "Ala" (compared case-insensitively by x_ValidAminoAcid)
      string abbreviation;

     // corresponding single-letter code, e.g. 'A'
     char letter;

 } ProteinAbbrevData;


 // Lookup table scanned linearly by x_ValidAminoAcid.
 // Note that the letter 'X' appears twice ("Xxx" and "OTHER") and that
 // "TERM" and "OTHER" are longer than three characters.
 static ProteinAbbrevData abbreviation_list[] =

 {

     {"Ala", 'A'},

     {"Asx", 'B'},

     {"Cys", 'C'},

     {"Asp", 'D'},

     {"Glu", 'E'},

     {"Phe", 'F'},

     {"Gly", 'G'},

     {"His", 'H'},

     {"Ile", 'I'},

     {"Xle", 'J'},  /* was - notice no 'J', breaks naive meaning of index -Karl */

     {"Lys", 'K'},

     {"Leu", 'L'},

     {"Met", 'M'},

     {"Asn", 'N'},

     {"Pyl", 'O'},  /* was - no 'O' */

     {"Pro", 'P'},

     {"Gln", 'Q'},

     {"Arg", 'R'},

     {"Ser", 'S'},

     {"Thr", 'T'},

     {"Val", 'V'},

     {"Trp", 'W'},

     {"Sec", 'U'}, /* was - not in iupacaa */

     {"Xxx", 'X'},

     {"Tyr", 'Y'},

     {"Glx", 'Z'},

     {"TERM", '*'}, /* not in iupacaa */ /*changed by Tatiana 06.07.95?`*/

     {"OTHER", 'X'}

 };


 // Map an amino-acid abbreviation to its single-letter code.
 //
 // An input of three or more characters is matched case-insensitively
 // against the abbreviation column of abbreviation_list; a one-character
 // input is matched (case-sensitively) against the letter column.
 // Returns 'X' when nothing matches, including for two-character input.
 char x_ValidAminoAcid(string_view abbrev)
 {
     const auto name_len = abbrev.length();

     if (name_len >= 3) {
         for (const ProteinAbbrevData& entry : abbreviation_list) {
             if (NStr::EqualNocase(abbrev, entry.abbreviation)) {
                 return entry.letter;
             }
         }
     } else if (name_len == 1) {
         const char wanted = abbrev[0];
         for (const ProteinAbbrevData& entry : abbreviation_list) {
             if (entry.letter == wanted) {
                 return entry.letter;
             }
         }
     }

     // unknown abbreviation
     return 'X';
 }


 // Strict-weak-ordering predicate: true when *dbt1 orders before *dbt2
 // according to CDbtag::Compare.  Both references are dereferenced
 // without a null check.
 bool s_DbtagCompare (const CRef<CDbtag>& dbt1, const CRef<CDbtag>& dbt2)
 {
     const int order = dbt1->Compare(*dbt2);
     return order < 0;
 }


 // Equality predicate: true when CDbtag::Compare reports *dbt1 and *dbt2
 // as equal.  Both references are dereferenced without a null check.
 bool s_DbtagEqual (const CRef<CDbtag>& dbt1, const CRef<CDbtag>& dbt2)
 {
     const int order = dbt1->Compare(*dbt2);
     return order == 0;
 }


 // Ordering predicate for synonyms: true when syn1 sorts before syn2 in a
 // case-insensitive comparison.
 bool s_OrgrefSynCompare( const string & syn1, const string & syn2 )
 {
     const int order = NStr::CompareNocase(syn1, syn2);
     return order < 0;
 }


 // Equality predicate for synonyms: true when syn1 and syn2 are equal
 // ignoring case.
 bool s_OrgrefSynEqual( const string & syn1, const string & syn2 )
 {
     const bool same_ignoring_case = NStr::EqualNocase(syn1, syn2);
     return same_ignoring_case;
 }


 END_SCOPE(objects)

 END_NCBI_SCOPE

Affil.hpp

Auth_list.hpp

Cit_gen.hpp

Cit_sub.hpp

Date.hpp

Imprint.hpp
User-defined methods of the data storage class.

MolInfo.hpp

Name_std.hpp

Org_ref.hpp

Person_id.hpp

Pub.hpp

Pub_equiv.hpp

Pubdesc.hpp

Seqdesc.hpp

CDbtag::Compare
int Compare(const CDbtag &dbt2) const
Definition: Dbtag.cpp:176

CGetSeqLocFromStringHelper_ReadLocFromText
Definition: asn2flat.cpp:1125

CGetSeqLocFromStringHelper_ReadLocFromText::CGetSeqLocFromStringHelper_ReadLocFromText
CGetSeqLocFromStringHelper_ReadLocFromText(CScope *scope)
Definition: cleanup_utils.cpp:570

CGetSeqLocFromStringHelper_ReadLocFromText::Seq_loc_Add
virtual CRef< CSeq_loc > Seq_loc_Add(const CSeq_loc &loc1, const CSeq_loc &loc2, CSeq_loc::TOpFlags flags)
Definition: cleanup_utils.cpp:573

CGetSeqLocFromStringHelper
Definition: seq_loc_from_string.hpp:46

CRef< CSeq_loc >

CScope
CScope –.
Definition: scope.hpp:92

CSeq_id
Definition: Seq_id.hpp:71

cleanup_pub.hpp

RemoveSpacesBetweenTildes
bool RemoveSpacesBetweenTildes(string &str)
remove white space between pairs of tildes.
Definition: cleanup_utils.cpp:229

CleanDoubleQuote
bool CleanDoubleQuote(string &str)
Change double to single quotes.
Definition: cleanup_utils.cpp:263

CleanVisString
bool CleanVisString(string &str)
Definition: cleanup_utils.cpp:71

comma_space
#define comma_space
Definition: cleanup_utils.cpp:316

space_comma
#define space_comma
Definition: cleanup_utils.cpp:312

space_semicolon
#define space_semicolon
Definition: cleanup_utils.cpp:315

ReadLocFromText
CRef< CSeq_loc > ReadLocFromText(const string &text, const CSeq_id *id, CScope *scope)
Definition: cleanup_utils.cpp:585

s_OrgrefSynCompare
bool s_OrgrefSynCompare(const string &syn1, const string &syn2)
Definition: cleanup_utils.cpp:667

s_DbtagEqual
bool s_DbtagEqual(const CRef< CDbtag > &dbt1, const CRef< CDbtag > &dbt2)
Definition: cleanup_utils.cpp:661

TrimInternalSemicolons
void TrimInternalSemicolons(string &str)
remove duplicate internal semicolons.
Definition: cleanup_utils.cpp:276

s_DbtagCompare
bool s_DbtagCompare(const CRef< CDbtag > &dbt1, const CRef< CDbtag > &dbt2)
Definition: cleanup_utils.cpp:654

semicolon_space
#define semicolon_space
Definition: cleanup_utils.cpp:317

x_ValidAminoAcid
char x_ValidAminoAcid(string_view abbrev)
Definition: cleanup_utils.cpp:632

bracket_space
#define bracket_space
Definition: cleanup_utils.cpp:314

s_OrgrefSynEqual
bool s_OrgrefSynEqual(const string &syn1, const string &syn2)
Definition: cleanup_utils.cpp:672

ProteinAbbrevData
struct proteinabbrev ProteinAbbrevData

abbreviation_list
static ProteinAbbrevData abbreviation_list[]
Definition: cleanup_utils.cpp:596

RemoveSpaces
bool RemoveSpaces(string &str)
remove all spaces from a string
Definition: cleanup_utils.cpp:548

twocommas
#define twocommas
Definition: cleanup_utils.cpp:309

twosemicolons
#define twosemicolons
Definition: cleanup_utils.cpp:311

space_bracket
#define space_bracket
Definition: cleanup_utils.cpp:313

CleanVisStringJunk
bool CleanVisStringJunk(string &str, bool allow_ellipses)
Definition: cleanup_utils.cpp:140

twospaces
#define twospaces
Definition: cleanup_utils.cpp:310

Asn2gnbkCompressSpaces
bool Asn2gnbkCompressSpaces(string &val)
weird space compression from C Toolkit
Definition: cleanup_utils.cpp:319

TrimSpacesSemicolonsAndCommas
bool TrimSpacesSemicolonsAndCommas(string &val)
Definition: cleanup_utils.cpp:465

cleanup_utils.hpp

ncbistd.hpp
Include a standard set of the NCBI C++ Toolkit most basic headers.

flags
static uch flags
Definition: ct_nlmzip_trees.cpp:342

out
std::ofstream out("events_result.xml")
main entry point for tests

next
static DLIST_TYPE *DLIST_NAME() next(DLIST_LIST_TYPE *list, DLIST_TYPE *item)
Definition: dlist.tmpl.h:56

str
static const char * str(char *buf, int n)
Definition: stats.c:84

ArraySize
constexpr size_t ArraySize(const Element(&)[Size])
Definition: ncbimisc.hpp:1532

NON_CONST_ITERATE
#define NON_CONST_ITERATE(Type, Var, Cont)
Non constant version of ITERATE macro.
Definition: ncbimisc.hpp:822

CSeq_loc::TOpFlags
int TOpFlags
Definition: Seq_loc.hpp:336

Seq_loc_Add
CRef< CSeq_loc > Seq_loc_Add(const CSeq_loc &loc1, const CSeq_loc &loc2, CSeq_loc::TOpFlags flags, CScope *scope)
Add two seq-locs.
Definition: seq_loc_util.cpp:2107

END_NCBI_SCOPE
#define END_NCBI_SCOPE
End previously defined NCBI scope.
Definition: ncbistl.hpp:103

END_SCOPE
#define END_SCOPE(ns)
End the previously defined scope.
Definition: ncbistl.hpp:75

BEGIN_NCBI_SCOPE
#define BEGIN_NCBI_SCOPE
Define ncbi namespace.
Definition: ncbistl.hpp:100

BEGIN_SCOPE
#define BEGIN_SCOPE(ns)
Define a new scope.
Definition: ncbistl.hpp:72

SIZE_TYPE
NCBI_NS_STD::string::size_type SIZE_TYPE
Definition: ncbistr.hpp:132

NStr::CompareNocase
static int CompareNocase(const CTempString s1, SIZE_TYPE pos, SIZE_TYPE n, const char *s2)
Case-insensitive compare of a substring with another string.
Definition: ncbistr.cpp:219

NPOS
#define NPOS
Definition: ncbistr.hpp:133

NStr::Find
static SIZE_TYPE Find(const CTempString str, const CTempString pattern, ECase use_case=eCase, EDirection direction=eForwardSearch, SIZE_TYPE occurrence=0)
Find the pattern in the string.
Definition: ncbistr.cpp:2882

NStr::EqualNocase
static bool EqualNocase(const CTempString s1, SIZE_TYPE pos, SIZE_TYPE n, const char *s2)
Case-insensitive equality of a substring with another string.
Definition: ncbistr.hpp:5347

NStr::Equal
static bool Equal(const CTempString s1, SIZE_TYPE pos, SIZE_TYPE n, const char *s2, ECase use_case=eCase)
Test for equality of a substring with another string.
Definition: ncbistr.hpp:5378

int
unsigned int
A callback function used to compare two keys in a database.
Definition: types.hpp:1210

text
static void text(MDB_val *v)
Definition: mdb_dump.c:62

objects
Definition: wiggle_export_job.hpp:44

ncbi_pch.hpp

isspace
int isspace(Uchar c)
Definition: ncbictype.hpp:69

in
std::istream & in(std::istream &in_, double &x_)

copy
void copy(Njn::Matrix< S > *matrix_, const Njn::Matrix< T > &matrix0_)
Definition: njn_matrix.hpp:613

Author.hpp

seq_loc_from_string.hpp

GetSeqLocFromString
CRef< CSeq_loc > GetSeqLocFromString(const string &text, const CSeq_id *id, CGetSeqLocFromStringHelper *helper)
Definition: seq_loc_from_string.cpp:579

seq_loc_util.hpp

seqdesc_ci.hpp

sequence.hpp

sequence_macros.hpp

proteinabbrev
Definition: cleanup_utils.cpp:591

proteinabbrev::abbreviation
string abbreviation
Definition: cleanup_utils.cpp:592

proteinabbrev::letter
char letter
Definition: cleanup_utils.cpp:593

eFiles::val
@ val

_ASSERT
#define _ASSERT
Definition: test_assert_impl.h:173

letter
static Uint4 letter(char c)
Definition: win_mask_gen_counts.cpp:62