This example is one of a few that shows how the CIFPARSE-OBJ library can be used to interface with Chimera, such that useful and interesting aspects of a molecule, e.g., certain connections among certain atoms, obtainable via parsing CIF files, can be located and used as the subject of a Chimera render or animation. This particular example shows how to retrieve and iterate over the struct_conn category, which delineates connections in a molecule, and locate connections of interest (in this case, covalent bonds) for Chimera to emphasize and animate. It is easy to extend this example, say, to handle a set of connection types of interest, each to be displayed in a different color in Chimera, or to focus on connection types of interest only among certain atoms of interest.
Save Connections.C to/path/to/cifparse-obj-vX.X-prod-src/parser-test-app-vX.X/src/
Save the CIF file anywhere, e.g.,/path/to/cifparse-obj-vX.X-prod-src/parser-test-app-vX.X/bin/
Add Connections.ext to the BASE_MAIN_FILES list in the Makefile in/path/to/cifparse-obj.vX.X-prod-src/parser-test-app-vX.X
Executemake
in the same directory as the Makefilecd
to bin, where the executable has been made, and run./Connections /path/to/5HVP.cif
, which generates a/path/to/5HVP.com
file which you can open withchimera /path/to/5HVP.com
Alternatively, you can save the script to/path/to/cifparse-obj-vX.X-prod-src/parser-test-app-vX.X/bin/
, set the Chimera path, and run./Connections.sh /path/to/5HVP.cif
, which will automate the process
#include "CifFile.h"
CifFile::GetBlockNames(vector<string>& blockNames)
. #include "ISTable.h"
/************************* * Connections.C * * For some CIF file, generate a Chimera command (COM) file * to iterate through and animate each interatomic covalent * connection in the molecule. * * Lines with superscriptions contain footnoted references or explanations. *************************/ #include <cstring> #include <fstream> #include <iostream> #include <map> #include <string> #include <vector> #include "CifFile.h" #include "CifParserBase.h" #include "ISTable.h" void prepareOutFile(std::ofstream& outFile, const string& cifFileName); void showUsage(); void writeConnection(std::ofstream& outFile, const string& select); int main(int argc, char **argv) { if (argc != 2) { showUsage(); } // The name of the CIF file string cifFileName = argv[1]; // A string to hold any parsing diagnostics string diagnostics; // Create CIF file and parser objects CifFile *cifFileP = new CifFile; CifParser *cifParserP = new CifParser(cifFileP); // Parse the CIF file cifParserP->Parse(cifFileName, diagnostics); // Delete the CIF parser, as it is no longer needed delete cifParserP; // Display any diagnostics if (!diagnostics.empty()) { std::cout << "Diagnostics: " << std::endl << diagnostics << std::endl; } // Get the first data block name in the CIF file string firstBlockName = cifFileP->GetFirstBlockName(); // Retrieve the first data block Block &block = cifFileP->GetBlock(firstBlockName); // Retrieve the table corresponding to the struct_conn category, which delineates connections1 ISTable& struct_conn = block.GetTable("struct_conn"); // Use the CIF file pathname to generate the Chimera command file (.COM) pathname size_t fileExtPos = cifFileName.find(".cif"); string outFileName = cifFileName.substr(0, fileExtPos) + ".com"; // Create the command file std::ofstream outFile; outFile.open(outFileName.c_str()); // Write out some basic Chimera initialization commands prepareOutFile(outFile, cifFileName); // Iterate through every row in the struct_conn category table, where each row delineates an interatomic connection for (unsigned int i = 0; i < struct_conn.GetNumRows(); ++i) { // Verify that the linkage is covalent, as indicated by the conn_type_id attribute2 if (struct_conn(i, "conn_type_id") != "covale") { continue; } // A Chimera selection string to build up for the two partner atoms string select; // Analyze the current row twice, once per partner for (unsigned int j = 0; j < 2; ++j) { // Determine which partner we are dealing with string partner = (!j) ? "ptnr1_" : "ptnr2_"; // Retrieve all the information necessary to uniquely identify that partner atom3 string alt_id = struct_conn(i, "pdbx_" + partner + "label_alt_id"); string asym_id = struct_conn(i, partner + "auth_asym_id"); string atom_id = struct_conn(i, partner + "label_atom_id"); string comp_id = struct_conn(i, partner + "auth_comp_id"); string seq_id = struct_conn(i, partner + "auth_seq_id"); // Add to the Chimera selection string for this atom4 select += ":" + seq_id + "," + comp_id + "." + asym_id + "@" + atom_id + "." + alt_id; // Add an OR to the selection string before partner 2 so that Chimera grabs both partner atoms if (!j) { select += " | "; } } // Write out commands for Chimera to customize the display of these connected atoms writeConnection(outFile, select); } // Write out the Chimera close command, as all connections have been processed outFile << "stop\n"; // Close the COM file outFile.close(); return 0; } void prepareOutFile(std::ofstream& outFile, const string& cifFileName) { outFile << "windowsize 500 500\n"; // Set the window size to 500 x 500 px outFile << "open " + cifFileName << std::endl; // Open the CIF file outFile << "preset apply pub 4\n"; // Apply publication preset #4 outFile << "color white\n"; // Color the entire molecule white outFile << "set bg_color gray\n"; // Color the background gray outFile << "repr bs\n"; // Represent the atoms in ball-and-stick format outFile << "savepos fullview\n"; // Remember this position (the full view of molecule) } void showUsage() { std::cout << "Usage: ./Connections /path/to/file.cif" << std::endl; exit(1); } // Write to the COM file a sequence of Chimera commands to be executed for every connection of interest void writeConnection(std::ofstream& outFile, const string& select) { outFile << "sel " + select << std::endl; // Select the two partner atoms outFile << "color byelement sel; label sel" << std::endl; // Color them using Chimera's color-by-element feature outFile << "sel sel za<3.0; wait 20\n"; // Further select all atoms within 3.0 angstroms of the partner atoms outFile << "focus sel; wait 25; ~disp ~sel; wait 68\n"; // Focus on the selection and hide all non-selected atoms outFile << "disp ~sel; ~label sel; reset fullview 20\n"; // Return to the full molecule view outFile << "color white sel; ~sel; wait 20\n"; // Uncolor and drop the selection }