#include <objtools/readers/message_listener.hpp>
#include <misc/data_loaders_util/data_loaders_util.hpp>
#include <util/format_guess.hpp>
#include "table2asn_context.hpp"
#include "async_token.hpp"
#include "multireader.hpp"
BEGIN_NCBI_SCOPE
using namespace objects;
class CSerialObject;
class CTable2AsnLogger;
class CMultiReader;
class CTable2AsnValidator;
class CMask;
class CTable2AsnStructuredCommentsReader;
class CFeatureTableReader;
class CMemorySrcFileMap;
namespace objects::edit {
class CHugeFile;
}
namespace objects::feature {
class CFeatTree;
}
class CTbl2AsnApp : public CNcbiApplication
{
public:
CTbl2AsnApp();
void Init() override;
int Run() override;
int DryRun() override
{
return Run();
}
using TAnnotMap = CMultiReader::TAnnotMap;
private:
static const CDataLoadersUtil::TLoaders default_loaders = CDataLoadersUtil::fGenbank | CDataLoadersUtil::fVDB | CDataLoadersUtil::fGenbankOffByDefault | CDataLoadersUtil::fSRA;
void Setup(const CArgs& args);
void ProcessOneFile(bool isAlignment, bool manageDiagnosticStreams = true, bool manageDataStream=true);
void ProcessOneFile(CNcbiOstream* output);
void xProcessOneFile(CFormatGuess::EFormat format,
CRef<CSerialObject> pInputObject,
TAnnotMap& annotMap,
CNcbiOstream* output);
void ProcessHugeFile(edit::CHugeFile& hugeFile, CNcbiOstream* output);
void ProcessOneFile(CFormatGuess::EFormat format, const string& contentType, unique_ptr<CNcbiIstream>& pIstr, CNcbiOstream* output);
void ProcessOneEntry(CFormatGuess::EFormat inputFormat, CRef<CSerialObject> obj, CRef<CSerialObject>& result);
void ProcessSingleEntry(CFormatGuess::EFormat inputFormat, TAsyncToken& token);
void MakeFlatFile(CSeq_entry_Handle seh, CRef<CSeq_submit> submit, std::ostream& ostream);
void ProcessTopEntry(CFormatGuess::EFormat inputFormat, bool need_update_date, CRef<CSeq_submit>& submit, CRef<CSeq_entry>& entry);
bool ProcessOneDirectory(const CDir& directory, const CMask& mask, bool recurse);
void ProcessAlignmentFile(CNcbiOstream* output);
void ReportUnusedSourceQuals();
void xProcessSecretFiles1Phase(bool readModsFromTitle, CSeq_entry& result);
void ProcessSecretFiles1Phase(bool readModsFromTitle, TAsyncToken&);
void ProcessSecretFiles2Phase(CSeq_entry& result) const;
void ProcessCMTFiles(CSeq_entry& result) const;
void LoadPEPFile(const string& pathname);
void LoadRNAFile(const string& pathname);
void LoadPRTFile(const string& pathname);
void LoadDSCFile(const string& pathname);
void LoadAdditionalFiles();
void LoadCMTFile(const string& pathname, unique_ptr<CTable2AsnStructuredCommentsReader>& comments);
void LoadAnnotMap(const string& pathname, TAnnotMap& annotMap);
void AddAnnots(CSeq_entry& entry);
void SetupAndOpenDiagnosticStreams();
void SetupAndOpenDataStreams();
void CloseDiagnosticStreams();
void CloseDataStreams();
void xProcessHugeEntries();
size_t xGetNumThreads() const;
void x_SetAlnArgs(CArgDescriptions& arg_desc);
struct TAdditionalFiles
{
unique_ptr<CTable2AsnStructuredCommentsReader> m_struct_comments;
CMultiReader::TAnnotMap m_AnnotMap;
set<string> m_MatchedAnnots;
CRef<CSeq_entry> m_replacement_proteins;
CRef<CSeq_entry> m_possible_proteins;
CRef<CSeq_descr> m_descriptors;
unique_ptr<CMemorySrcFileMap> mp_src_qual_map;
unique_ptr<CFeatureTableReader> m_feature_table_reader;
};
TAdditionalFiles m_global_files;
unique_ptr<TAdditionalFiles> m_secret_files;
unique_ptr<CMultiReader> m_reader;
CRef<CTable2AsnValidator> m_validator;
CRef<CTable2AsnLogger> m_logger;
CTable2AsnContext m_context;
static const Int8 TBL2ASN_MAX_ALLOWED_FASTA_SIZE = INT8_C(0x7FFFFFFF);
};
class CTable2AsnLogger : public CMessageListenerLenient, public CDiagHandler
{
public:
CTable2AsnLogger() : m_enable_log(false) {}
bool m_enable_log;
void PutProgress(
const string& sMessage,
const Uint8 iNumDone = 0,
const Uint8 iNumTotal = 0) override;
bool PutMessage(const IObjtoolsMessage& message) override;
void Post(const SDiagMessage& mess) override;
};
END_NCBI_SCOPE
0001
0002
0003
0004
0005
0006
0007
0008
0009
0010
0011
0012
0013
0014
0015
0016
0017
0018
0019
0020
0021
0022
0023
0024
0025
0026
0027
0028
0029
0030
0031
0032
0033
0034
0035
0036
0037
0038
0039
0040
0041
0042
0043
0044
0045
0046
0047
0048
0049
0050
0051
0052
0053
0054
0055
0056
0057
0058
0059
0060
0061
0062
0063
0064
0065
0066
0067
0068
0069
0070
0071
0072
0073
0074
0075
0076
0077
0078
0079
0080
0081
0082
0083
0084
0085
0086
0087
0088
0089
0090
0091
0092
0093
0094
0095
0096
0097
0098
0099
0100
0101
0102
0103
0104
0105
0106
0107
0108
0109
0110
0111
0112
0113
0114
0115
0116
0117
0118
0119
0120
0121
0122
0123
0124
0125
0126
0127
0128
0129
0130
0131
0132
0133
0134
0135
0136
0137
0138
0139
0140
0141
0142
0143
0144
0145
0146
0147
0148
0149
0150
0151
0152
0153
0154
0155
0156
0157
0158
0159
0160
0161
0162