prosite_search.cpp
来自「ncbi源码」· C++ 代码 · 共 374 行
CPP
374 行
/*
 * ===========================================================================
 * PRODUCTION $Log: prosite_search.cpp,v $
 * PRODUCTION Revision 1000.6 2004/06/01 20:55:39 gouriano
 * PRODUCTION PRODUCTION: UPGRADED [GCC34_MSVC7] Dev-tree R1.23
 * PRODUCTION
 * ===========================================================================
 */

/* $Id: prosite_search.cpp,v 1000.6 2004/06/01 20:55:39 gouriano Exp $
 * ===========================================================================
 *
 * PUBLIC DOMAIN NOTICE
 * National Center for Biotechnology Information
 *
 * This software/database is a "United States Government Work" under the
 * terms of the United States Copyright Act. It was written as part of
 * the author's official duties as a United States Government employee and
 * thus cannot be copyrighted. This software/database is freely available
 * to the public for use. The National Library of Medicine and the U.S.
 * Government have not placed any restriction on its use or reproduction.
 *
 * Although all reasonable efforts have been taken to ensure the accuracy
 * and reliability of the software and data, the NLM and the U.S.
 * Government do not and cannot warrant the performance or results that
 * may be obtained by using this software or data. The NLM and the U.S.
 * Government disclaim all warranties, express or implied, including
 * warranties of performance, merchantability or fitness for any particular
 * purpose.
 *
 * Please cite the author in any work or product based on this material.
 *
 * ===========================================================================
 *
 * Authors: Josh Cherry
 *
 * File Description: gbench plugin for searching against prosite patterns
 *
 */

#include <ncbi_pch.hpp>
#include "prosite_search.hpp"
#include "prosite.hpp"
#include <algo/sequence/find_pattern.hpp>
#include <corelib/ncbiapp.hpp>
#include <corelib/ncbireg.hpp>
#include <gui/core/plugin_utils.hpp>
#include <gui/utils/system_path.hpp>
#include <gui/core/version.hpp>
#include <gui/dialogs/col/multi_col_dlg.hpp>
#include <gui/plugin/PluginCommandSet.hpp>
#include <gui/plugin/PluginInfo.hpp>
#include <gui/plugin/PluginRequest.hpp>
#include <gui/plugin/PluginValueConstraint.hpp>
#include <gui/utils/message_box.hpp>
#include <gui/objutils/utils.hpp>
#include <objects/seqloc/Seq_interval.hpp>
#include <objmgr/seq_vector.hpp>
#include <objmgr/util/sequence.hpp>


BEGIN_NCBI_SCOPE
USING_SCOPE(objects);


CAlgoPlugin_PrositeSearch::~CAlgoPlugin_PrositeSearch()
{
}


/// Standard plugin announce boilerplate.
///
/// Resets @a info, fills in the plugin's version / class name / menu entry /
/// tooltip, and registers the single "run" algorithm command together with
/// its two arguments:
///   - "locs": an array of CSeq_loc objects to search;
///   - "skip": boolean, default "true", controlling whether entries whose
///             skip flag is set are ignored.
///
/// @param info  Plugin description object to populate.
void CAlgoPlugin_PrositeSearch::GetInfo(CPluginInfo& info)
{
    info.Reset();

    // version info macro
    info.SetInfo(CPluginVersion::eMajor, CPluginVersion::eMinor, 0,
                 string(__DATE__) + " " + string(__TIME__),
                 "CAlgoPlugin_PrositeSearch",
                 "Search/Search against prosite",
                 "Search a protein sequence against prosite patterns",
                 "");

    // command info
    CPluginCommandSet& cmds = info.SetCommands();
    CPluginCommand&    args = cmds.AddAlgoCommand(eAlgoCommand_run);
    args.AddArgument("locs", "Locations to evaluate",
                     CSeq_loc::GetTypeInfo(),
                     CPluginArg::TData::e_Array);
    // NOTE(review): the parenthesised comma expression presumably relies on
    // an overloaded operator, of CPluginValueConstraint to attach
    // CSeq_inst::eMol_aa to the constraint -- confirm against its header.
    args.SetConstraint("locs",
                       (*CPluginValueConstraint::CreateSeqMol(),
                        CSeq_inst::eMol_aa));
    args.AddDefaultArgument("skip", "Skip patterns with SKIP_FLAG set",
                            CPluginArg::eBoolean, "true");
}


/// Run the PROSITE search over every location passed in the "locs" argument.
///
/// For each location the sequence is fetched as IUPAC text, every loaded
/// PROSITE entry (optionally excluding those with the skip flag) is converted
/// to a PCRE and searched, and each hit is
///   - written as a row of the results dialog (1-based positions), and
///   - added as a region feature (0-based positions, remapped through
///     CSeqUtils::RemapChildToParent) to a new annotation named
///     "Prosite matches" that is attached to the reply.
///
/// Failure to load the PROSITE data shows a message box and sets the reply
/// status to eMessageStatus_failed.  Exceptions raised while processing a
/// single location are logged and that location is abandoned; the remaining
/// locations are still processed.
///
/// @param msg  Plugin message carrying the request arguments and receiving
///             the reply.
void CAlgoPlugin_PrositeSearch::RunCommand(CPluginMessage& msg)
{
    const CPluginCommand& args = msg.GetRequest().GetCommand();
    CPluginReply& reply = msg.SetReply();

    _TRACE("CAlgoPlugin_PrositeSearch::RunCommand()");

    bool skip = args["skip"].AsBoolean();

    // load patterns from file
    vector<CPrositeEntry> entries;
    try {
        x_LoadPrositeData(entries);
    }
    catch (const exception& e) {
        NcbiMessageBox(e.what());
        reply.SetStatus(eMessageStatus_failed);
        return;
    }

    // the dialog is created on first use and reused on later runs
    if ( !m_Dialog.get() ) {
        m_Dialog.reset(new CMultiColDlg());
        m_Dialog->SetWindowSize(1000, 350);
        m_Dialog->SetTitle("Pattern Search Results");
        m_Dialog->SetColumn(0, "Sequence",            FL_ALIGN_LEFT,   1.0f);
        m_Dialog->SetColumn(1, "Location",            FL_ALIGN_LEFT,   1.0f);
        m_Dialog->SetColumn(2, "Position",            FL_ALIGN_CENTER, 1.0f);
        m_Dialog->SetColumn(3, "Pattern ID",          FL_ALIGN_LEFT,   3.0f);
        m_Dialog->SetColumn(4, "Pattern Description", FL_ALIGN_LEFT,   4.0f);
        m_Dialog->SetColumn(5, "Pattern",             FL_ALIGN_LEFT,   3.0f);
        m_Dialog->SetColumn(6, "Matched Sequence",    FL_ALIGN_LEFT,   2.0f);
    }
    m_Dialog->SetRows(0);  // to clear any previous contents

    vector<TSeqPos> starts;
    vector<TSeqPos> ends;

    //
    // first, evaluate whole sequences
    //
    int row = 0;
    plugin_args::TLocList locs;
    GetArgValue(args["locs"], locs);

    // Must start at 0: it is only assigned inside the per-location try block,
    // so with no locations (or an exception before the assignment) the
    // summary label below would otherwise read an indeterminate value.
    // It is reset for every location, so the label reports the count for the
    // last location that reached the pattern loop.
    unsigned int patterns_searched = 0;

    ITERATE (plugin_args::TLocList, iter, locs) {
        const CSeq_loc&  loc = *iter->second;
        const IDocument& doc = *iter->first;

        try {
            CBioseq_Handle handle = doc.GetScope().GetBioseqHandle(loc);
            CSeqVector vec =
                handle.GetSequenceView(loc,
                                       CBioseq_Handle::eViewConstructed,
                                       CBioseq_Handle::eCoding_Iupac);

            string seq;
            vec.GetSeqData( (TSeqPos) 0, vec.size(), seq );

            // Sequence / Location columns are filled once, on the first row
            // belonging to this location.
            string& id_str  = m_Dialog->SetCell(row, 0);
            string& loc_str = m_Dialog->SetCell(row, 1);

            // find the best ID for this bioseq
            const CSeq_id& best_id =
                sequence::GetId(handle, sequence::eGetId_Best);
            id_str.erase();
            best_id.GetLabel(&id_str);
            loc_str = CPluginUtils::GetLabel(loc, &doc.GetScope());

            // a new feature table
            CRef<CSeq_annot> annot(new CSeq_annot());

            patterns_searched = 0;

            // iterate over patterns
            ITERATE (vector<CPrositeEntry>, entry, entries) {
                if (entry->GetSkipFlag() && skip) {
                    continue;  // skip this pattern entry
                }
                string pcre = CProsite::PSPatternToPCRE(entry->GetPattern());
                CFindPattern::Find(seq, pcre, starts, ends);
                patterns_searched++;

                //
                // add one dialog row per match
                //
                for (size_t k = 0;  k < starts.size();  ++k) {
                    string& pos_str = m_Dialog->SetCell(row, 2);
                    // 1-based indexing for dialog
                    pos_str  = NStr::IntToString(starts[k] + 1) + " - "
                             + NStr::IntToString(ends[k]   + 1);
                    m_Dialog->SetCell(row, 3) = entry->GetId();
                    m_Dialog->SetCell(row, 4) = entry->GetDesc();
                    m_Dialog->SetCell(row, 5) = entry->GetPattern();
                    // ends[k] is used as an inclusive end, hence the + 1
                    m_Dialog->SetCell(row, 6) =
                        seq.substr(starts[k], ends[k] - starts[k] + 1);
                    ++row;
                }

                //
                // add features to annot
                //
                for (size_t k = 0;  k < starts.size();  ++k) {
                    // create feature
                    CRef<CSeq_feat> feat(new CSeq_feat());

                    // set correct location: build an interval relative to the
                    // searched location, then remap it onto the parent
                    CSeq_loc& floc = feat->SetLocation();
                    floc.SetInt().SetId().Assign(sequence::GetId(loc));
                    floc.SetInt().SetFrom(starts[k]);
                    floc.SetInt().SetTo  (ends[k]);
                    feat->SetLocation
                        (*CSeqUtils::RemapChildToParent(loc, floc));

                    // set feature data
                    feat->SetData().SetRegion() = "Prosite match: " +
                        entry->GetDesc() + "; " + entry->GetId();

                    // save in annot
                    annot->SetData().SetFtable().push_back(feat);
                }
            }

            // add description to annot
            annot->SetName("Prosite matches");

            // attach annot to doc
            //const_cast<IDocument&>(doc).AttachAnnot(*annot);
            reply.AddObject(doc, *annot);
        }
        catch (const exception& e) {
            LOG_POST(Error << e.what());
            string str = CPluginUtils::GetLabel(loc, &doc.GetScope());
            LOG_POST(Error << "Error processing location " << str);
        }
#ifndef _DEBUG
        // release builds only: log anything else and keep going
        catch (...) {
            string str = CPluginUtils::GetLabel(loc, &doc.GetScope());
            LOG_POST(Error << "Error processing location " << str);
        }
#endif
    }

    // update all views
    //CDocManager::UpdateAllViews();

    //
    // prepare our dialog box
    //
    m_Dialog->SetLabel(string("A search against ") +
                       NStr::IntToString(patterns_searched) +
                       " patterns produced:");
    m_Dialog->Show();

    reply.SetStatus(eMessageStatus_success);
    reply.AddAction(CPluginReplyAction::e_Add_to_document);
}


/// Locate the PROSITE data file and read its entries.
///
/// The candidate list passed to CSystemPath::ResolvePathExisting() is, in
/// order:
///   1. the value of the registry variable [PROSITE_SEARCH] PrositeData,
///      if it is non-empty;
///   2. <home>/etc/prosite.dat;
///   3. <std>/etc/prosite.dat.
///
/// @param entries  Receives the entries read by CProsite::ReadEntries().
/// @throws runtime_error  if no candidate resolves to an existing path, or
///                        if the resolved file cannot be opened for reading.
void CAlgoPlugin_PrositeSearch::x_LoadPrositeData(vector<CPrositeEntry>& entries)
{
    CNcbiApplication* app = CNcbiApplication::Instance();
    _ASSERT(app);
    CNcbiRegistry& registry = app->GetConfig();

    string fname;

    // By default the PROSITE data file is looked for in
    // <home>/etc/prosite.dat and then <std>/etc/prosite.dat.
    // A path given in the application registry variable
    // [PROSITE_SEARCH] PrositeData is tried before those.
    fname = registry.GetString("PROSITE_SEARCH", "PrositeData", "");
    if ( !fname.empty() ) {
        fname += ", ";
    }
    fname += "<home>/etc/prosite.dat, <std>/etc/prosite.dat";
    fname = CSystemPath::ResolvePathExisting(fname);
    if ( fname.empty() ) {
        throw runtime_error("Couldn't open PROSITE file");
    }

    ifstream psfile(fname.c_str());
    // An existing path may still be unreadable; report it through the same
    // exception path instead of reading from a failed stream.
    if ( !psfile ) {
        throw runtime_error("Couldn't open PROSITE file " + fname);
    }
    CProsite::ReadEntries(psfile, entries);
}


END_NCBI_SCOPE

/*
 * ===========================================================================
 * $Log: prosite_search.cpp,v $
 * Revision 1000.6 2004/06/01 20:55:39 gouriano
 * PRODUCTION: UPGRADED [GCC34_MSVC7] Dev-tree R1.23
 *
 * Revision 1.23 2004/05/21 22:27:47 gorelenk
 * Added PCH ncbi_pch.hpp
 *
 * Revision 1.22 2004/05/03 13:05:42 dicuccio
 * gui/utils --> gui/objutils where needed
 *
 * Revision 1.21 2004/03/05 17:35:37 dicuccio
 * Use sequence::GetId() instead of CSeq_id::GetStringDescr()
 *
 * Revision 1.20 2004/02/17 20:35:25 rsmith
 * moved core/settings.[ch]pp and core/system_path.[ch]pp to config and utils, respectively.
 *
 * Revision 1.19 2004/02/13 15:08:50 mjohnson
 * Removed local URL for plugin help.
 *
 * Revision 1.18 2004/01/27 18:38:08 dicuccio
 * Code clean-up. Use standard names for plugins. Removed unnecessary #includes
 *
 * Revision 1.17 2004/01/07 15:50:38 dicuccio
 * Adjusted for API change in CPluginUtils::GetLabel(). Standardized exception
 * reporting in algorithms.
 *
 * Revision 1.16 2003/12/15 20:16:08 jcherry
 * Changed CFindPattern::Find to take a string rather than a CSeqVector
 *
 * Revision 1.15 2003/11/24 15:45:28 dicuccio
 * Renamed CVersion to CPluginVersion
 *
 * Revision 1.14 2003/11/18 17:48:38 dicuccio
 * Added standard processing of return values
 *
 * Revision 1.13 2003/11/14 00:20:29 jcherry
 * Added url for help
 *
 * Revision 1.12 2003/11/06 20:12:12 dicuccio
 * Cleaned up handling of USING_SCOPE - removed from all headers
 *
 * Revision 1.11 2003/11/04 17:49:23 dicuccio
 * Changed calling parameters for plugins - pass CPluginMessage instead of paired
 * CPluginCommand/CPluginReply
 *
 * Revision 1.10 2003/10/27 17:46:49 dicuccio
 * Removed dead #includes
 *
 * Revision 1.9 2003/10/14 16:24:02 dicuccio
 * Added correct remapping of scanned locations to the parent location. Cleaned
 * up code to look for data file - added hierarchichal search through path in INI,
 * user's home directory, and finally system installed path.
 *
 * Revision 1.8 2003/10/07 13:47:00 dicuccio
 * Renamed CPluginURL* to CPluginValue*
 *
 * Revision 1.7 2003/09/25 17:21:35 jcherry
 * Added name to annot
 *
 * Revision 1.6 2003/09/04 14:05:24 dicuccio
 * Use IDocument instead of CDocument
 *
 * Revision 1.5 2003/09/03 14:46:53 rsmith
 * change namespace name from args to plugin_args to avoid clashes with variable names.
 *
 * Revision 1.4 2003/08/21 12:03:07 dicuccio
 * Make use of new typedef in plugin_utils.hpp for argument values.
 *
 * Revision 1.3 2003/08/15 18:48:06 jcherry
 * Brought dialog handling up to date.
 *
 * Revision 1.2 2003/08/11 18:03:25 jcherry
 * Fixed to use 0-based indexing for feature table (but retain
 * 1-based indexing for dialog box)
 *
 * Revision 1.1 2003/08/04 20:05:45 jcherry
 * Initial version
 *
 * ===========================================================================
 */
⌨️ 快捷键说明
复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?