This example is one of a few that shows how the CIFPARSE-OBJ library can be used to interface with Chimera, such that useful and interesting aspects of a molecule, e.g., certain connections among certain atoms, obtainable via parsing CIF files, can be located and used as the subject of a Chimera render or animation. This particular example shows how to retrieve and iterate over the struct_conn category, which delineates connections in a molecule, and locate connections of interest (in this case, covalent bonds) for Chimera to emphasize and animate. It is easy to extend this example, say, to handle a set of connection types of interest, each to be displayed in a different color in Chimera, or to focus on connection types of interest only among certain atoms of interest.
Save Connections.C to/path/to/cifparse-obj-vX.X-prod-src/parser-test-app-vX.X/src/Save the CIF file anywhere, e.g.,/path/to/cifparse-obj-vX.X-prod-src/parser-test-app-vX.X/bin/Add Connections.ext to the BASE_MAIN_FILES list in the Makefile in/path/to/cifparse-obj.vX.X-prod-src/parser-test-app-vX.XExecutemakein the same directory as the Makefilecdto bin, where the executable has been made, and run./Connections /path/to/5HVP.cif, which generates a/path/to/5HVP.comfile which you can open withchimera /path/to/5HVP.comAlternatively, you can save the script to/path/to/cifparse-obj-vX.X-prod-src/parser-test-app-vX.X/bin/, set the Chimera path, and run./Connections.sh /path/to/5HVP.cif, which will automate the process
#include "CifFile.h"
CifFile::GetBlockNames(vector<string>& blockNames). #include "ISTable.h"
/*************************
* Connections.C
*
* For some CIF file, generate a Chimera command (COM) file
* to iterate through and animate each interatomic covalent
* connection in the molecule.
*
* Lines with superscriptions contain footnoted references or explanations.
*************************/
#include <cstring>
#include <fstream>
#include <iostream>
#include <map>
#include <string>
#include <vector>
#include "CifFile.h"
#include "CifParserBase.h"
#include "ISTable.h"
void prepareOutFile(std::ofstream& outFile, const string& cifFileName);
void showUsage();
void writeConnection(std::ofstream& outFile, const string& select);
int main(int argc, char **argv)
{
if (argc != 2)
{
showUsage();
}
// The name of the CIF file
string cifFileName = argv[1];
// A string to hold any parsing diagnostics
string diagnostics;
// Create CIF file and parser objects
CifFile *cifFileP = new CifFile;
CifParser *cifParserP = new CifParser(cifFileP);
// Parse the CIF file
cifParserP->Parse(cifFileName, diagnostics);
// Delete the CIF parser, as it is no longer needed
delete cifParserP;
// Display any diagnostics
if (!diagnostics.empty())
{
std::cout << "Diagnostics: " << std::endl << diagnostics << std::endl;
}
// Get the first data block name in the CIF file
string firstBlockName = cifFileP->GetFirstBlockName();
// Retrieve the first data block
Block &block = cifFileP->GetBlock(firstBlockName);
// Retrieve the table corresponding to the struct_conn category, which delineates connections1
ISTable& struct_conn = block.GetTable("struct_conn");
// Use the CIF file pathname to generate the Chimera command file (.COM) pathname
size_t fileExtPos = cifFileName.find(".cif");
string outFileName = cifFileName.substr(0, fileExtPos) + ".com";
// Create the command file
std::ofstream outFile;
outFile.open(outFileName.c_str());
// Write out some basic Chimera initialization commands
prepareOutFile(outFile, cifFileName);
// Iterate through every row in the struct_conn category table, where each row delineates an interatomic connection
for (unsigned int i = 0; i < struct_conn.GetNumRows(); ++i)
{
// Verify that the linkage is covalent, as indicated by the conn_type_id attribute2
if (struct_conn(i, "conn_type_id") != "covale")
{
continue;
}
// A Chimera selection string to build up for the two partner atoms
string select;
// Analyze the current row twice, once per partner
for (unsigned int j = 0; j < 2; ++j)
{
// Determine which partner we are dealing with
string partner = (!j) ? "ptnr1_" : "ptnr2_";
// Retrieve all the information necessary to uniquely identify that partner atom3
string alt_id = struct_conn(i, "pdbx_" + partner + "label_alt_id");
string asym_id = struct_conn(i, partner + "auth_asym_id");
string atom_id = struct_conn(i, partner + "label_atom_id");
string comp_id = struct_conn(i, partner + "auth_comp_id");
string seq_id = struct_conn(i, partner + "auth_seq_id");
// Add to the Chimera selection string for this atom4
select += ":" + seq_id + "," + comp_id + "." + asym_id + "@" + atom_id + "." + alt_id;
// Add an OR to the selection string before partner 2 so that Chimera grabs both partner atoms
if (!j)
{
select += " | ";
}
}
// Write out commands for Chimera to customize the display of these connected atoms
writeConnection(outFile, select);
}
// Write out the Chimera close command, as all connections have been processed
outFile << "stop\n";
// Close the COM file
outFile.close();
return 0;
}
void prepareOutFile(std::ofstream& outFile, const string& cifFileName)
{
outFile << "windowsize 500 500\n"; // Set the window size to 500 x 500 px
outFile << "open " + cifFileName << std::endl; // Open the CIF file
outFile << "preset apply pub 4\n"; // Apply publication preset #4
outFile << "color white\n"; // Color the entire molecule white
outFile << "set bg_color gray\n"; // Color the background gray
outFile << "repr bs\n"; // Represent the atoms in ball-and-stick format
outFile << "savepos fullview\n"; // Remember this position (the full view of molecule)
}
void showUsage()
{
std::cout << "Usage: ./Connections /path/to/file.cif" << std::endl;
exit(1);
}
// Write to the COM file a sequence of Chimera commands to be executed for every connection of interest
void writeConnection(std::ofstream& outFile, const string& select)
{
outFile << "sel " + select << std::endl; // Select the two partner atoms
outFile << "color byelement sel; label sel" << std::endl; // Color them using Chimera's color-by-element feature
outFile << "sel sel za<3.0; wait 20\n"; // Further select all atoms within 3.0 angstroms of the partner atoms
outFile << "focus sel; wait 25; ~disp ~sel; wait 68\n"; // Focus on the selection and hide all non-selected atoms
outFile << "disp ~sel; ~label sel; reset fullview 20\n"; // Return to the full molecule view
outFile << "color white sel; ~sel; wait 20\n"; // Uncolor and drop the selection
}