1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615
|
/**********************************************************************
main.cpp - Main conversion program, command-line handling.
Copyright (C) 1998-2001 by OpenEye Scientific Software, Inc.
Some portions Copyright (C) 2001-2006 by Geoffrey R. Hutchison
Some portions Copyright (C) 2004-2006 by Chris Morley
This file is part of the Open Babel project.
For more information, see <http://openbabel.sourceforge.net/>
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation version 2 of the License.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
***********************************************************************/
// used to set import/export for Cygwin DLLs
#ifdef WIN32
#define USING_OBDLL
#endif
#include <openbabel/babelconfig.h>
#include <iostream>
#include <fstream>
#include <sstream>
#include <string>
#include <map>
#if HAVE_CONIO_H
#include <conio.h>
#endif
#if !HAVE_STRNCASECMP
extern "C" int strncasecmp(const char *s1, const char *s2, size_t n);
#endif
#include <openbabel/obconversion.h>
#include <openbabel/plugin.h>
#include <cstdlib>
#include <cstring>
using namespace std;
using namespace OpenBabel;
void DoOption(const char* p, OBConversion& Conv, OBConversion::Option_type typ,
int& arg, int argc, char *argv[]);
void usage();
void help();
// There isn't a great way to do this -- we need to save argv[0] for usage()
static char *program_name;
int main(int argc,char *argv[])
{
OBConversion Conv(&cin, &cout); //default input and output are console
OBFormat* pInFormat = NULL;
OBFormat* pOutFormat = NULL;
vector<string> FileList, OutputFileList;
string OutputFileName;
// Parse commandline
bool gotInType = false, gotOutType = false;
bool SplitOrBatch=false;
char *oext = NULL;
char *iext = NULL;
//Save name of program without its path (and .exe)
string pn(argv[0]);
string::size_type pos;
#ifdef _WIN32
pos = pn.find(".exe");
if(pos!=string::npos)
argv[0][pos]='\0';
#endif
pos = pn.find_last_of("/\\");
if(pos==string::npos)
program_name=argv[0];
else
program_name=argv[0]+pos+1;
const char* p;
int arg;
for (arg = 1; arg < argc; ++arg)
{
if (argv[arg])
{
if (argv[arg][0] == '-')
{
switch (argv[arg][1])
{
case 'V':
{
cout << "Open Babel " << BABEL_VERSION << " -- "
<< __DATE__ << " -- " << __TIME__ << endl;
exit(0);
}
case 'i':
gotInType = true;
iext = argv[arg] + 2;
if(!*iext)
iext = argv[++arg]; //space left after -i: use next argument
if (strncasecmp(iext, "MIME", 4) == 0)
{
// get the MIME type from the next argument
iext = argv[++arg];
pInFormat = Conv.FormatFromMIME(iext);
}
else
{
//The ID provided by the OBFormat class is used as the identifying file extension
pInFormat = Conv.FindFormat(iext);
}
if(pInFormat==NULL)
{
cerr << program_name << ": cannot read input format!" << endl;
usage();
}
break;
case 'o':
gotOutType = true;
oext = argv[arg] + 2;
if(!*oext)
oext = argv[++arg]; //space left after -i: use next argument
if (strncasecmp(oext, "MIME", 4) == 0)
{
// get the MIME type from the next argument
oext = argv[++arg];
pOutFormat = Conv.FormatFromMIME(oext);
}
else
pOutFormat = Conv.FindFormat(oext);
if(pOutFormat==NULL)
{
cerr << program_name << ": cannot write output format!" << endl;
usage();
}
break;
/*case 'F':
if(!Conv.SetOutFormat("fpt"))
cout << "FingerprintFormat needs to be loaded" << endl;
else
{
Conv.AddOption("F",OBConversion::OUTOPTIONS);
Conv.Write(NULL);
}
return 0;
*/
case 'L': //display a list of plugin type or classes
{
const char* param=NULL;
if(argc>arg+1)
param = argv[arg+2];
OBPlugin::List(argv[arg+1], param);
return 0;
}
case '?':
case 'H':
if(isalnum(argv[arg][2]) || arg==argc-2)
{
if(strncasecmp(argv[arg]+2,"all",3))
{
const char* pID= (arg==argc-2) ? argv[arg+1] : argv[arg]+2;
OBFormat* pFormat = Conv.FindFormat(pID);
if(pFormat)
{
cout << pID << " " << pFormat->Description() << endl;
if(pFormat->Flags() & NOTWRITABLE)
cout << " This format is Read-only" << endl;
if(pFormat->Flags() & NOTREADABLE)
cout << " This format is Write-only" << endl;
if(strlen(pFormat->SpecificationURL()))
cout << "Specification at: " << pFormat->SpecificationURL() << endl;
}
else
cout << "Format type: " << pID << " was not recognized" <<endl;
}
else
{
OBPlugin::List("formats","verbose");
}
}
else
help();
return 0;
case '-': //long option --name text
{
//Do nothing if name is empty
//Option's text is the next arg provided it doesn't start with -
char* nam = argv[arg]+2;
if(*nam != '\0')
{
string txt;
int i;
for(i=0; i<Conv.GetOptionParams(nam, OBConversion::GENOPTIONS)
&& arg<argc-1 && argv[arg+1];++i) //removed && *argv[arg+1]!='-'
{
if(!txt.empty()) txt+=' ';
txt += argv[++arg];
}
if(*nam=='-')
{
// Is a API directive, e.g.---errorlevel
//Send to the pseudoformat "obapi" (without any leading -)
OBConversion apiConv;
OBFormat* pAPI= OBConversion::FindFormat("obapi");
if(pAPI)
{
apiConv.SetOutFormat(pAPI);
apiConv.AddOption(nam+1, OBConversion::GENOPTIONS, txt.c_str());
apiConv.Write(NULL, &std::cout);
}
}
else
// Is a long option name, e.g --addtotitle
Conv.AddOption(nam,OBConversion::GENOPTIONS,txt.c_str());
}
}
break;
case 'm': //multiple output files
SplitOrBatch=true;
break;
case 'a': //single character input option
p = argv[arg]+2;
DoOption(p,Conv,OBConversion::INOPTIONS,arg,argc,argv);
break;
case 'x': //single character output option
p = argv[arg]+2;
DoOption(p,Conv,OBConversion::OUTOPTIONS,arg,argc,argv);
break;
default: //single character general option
p = argv[arg]+1;
DoOption(p,Conv,OBConversion::GENOPTIONS,arg,argc,argv);
break;
}
}
else
{
//filenames
if(!gotOutType)
FileList.push_back(argv[arg]);
else
OutputFileName = argv[arg];
}
}
}
if(!gotOutType) //the last file is the output
{
if(FileList.empty())
{
cerr << "No output file or format spec!" << endl;
usage();
}
OutputFileName = FileList.back();
FileList.pop_back();
}
#ifdef _WIN32
//Expand wildcards in input filenames and add to FileList
vector<string> tempFileList(FileList);
FileList.clear();
vector<string>::iterator itr;
for(itr=tempFileList.begin();itr!=tempFileList.end();++itr)
DLHandler::findFiles (FileList, *itr);
#endif
if (!gotInType)
{
if(FileList.empty())
{
cerr << "No input file or format spec!" <<endl;
usage();
}
}
if (!gotOutType)
{
pOutFormat = Conv.FormatFromExt(OutputFileName.c_str());
if(pOutFormat==NULL)
{
cerr << program_name << ": cannot write output format!" << endl;
usage();
}
}
if(!Conv.SetInFormat(pInFormat))
{
cerr << "Invalid input format" << endl;
usage();
}
if(!Conv.SetOutFormat(pOutFormat))
{
cerr << "Invalid output format" << endl;
usage();
}
if(SplitOrBatch)
{
//Put * into output file name before extension (or ext.gz)
if(OutputFileName.empty())
{
OutputFileName = "*.";
if (oext != NULL)
OutputFileName += oext;
}
else
{
string::size_type pos = OutputFileName.rfind(".gz");
if(pos==string::npos)
pos = OutputFileName.rfind('.');
else
pos = OutputFileName.rfind('.',pos-1);
if(pos==string::npos)
OutputFileName += '*';
else
OutputFileName.insert(pos,"*");
}
}
int count = Conv.FullConvert(FileList, OutputFileName, OutputFileList);
Conv.ReportNumberConverted(count);
if(OutputFileList.size()>1)
{
clog << OutputFileList.size() << " files output. The first is " << OutputFileList[0] <<endl;
}
std::string messageSummary = obErrorLog.GetMessageSummary();
if (messageSummary.size())
{
clog << messageSummary << endl;
}
#ifdef _DEBUG
//CM keep window open
cout << "Press any key to finish" <<endl;
getch();
#endif
return 0;
}
void DoOption(const char* p, OBConversion& Conv,
OBConversion::Option_type typ, int& arg, int argc, char *argv[])
{
while(p && *p) //can have multiple single char options
{
char ch[2]="?";
*ch = *p++;
const char* txt=NULL;
//Get the option text if needed
int nParams = Conv.GetOptionParams(ch, typ);
if(nParams)
{
if(*p)
{
txt = p; //use text immediately following the option letter
p=NULL; //no more single char options
}
else if(arg<argc-1)
{
txt = argv[++arg]; //use text from next arg
if(*txt=='-')
{
//...unless it is another option
cerr << "Option -" << ch << " takes a parameter" << endl;
exit(0);
}
}
}
Conv.AddOption(ch, typ, txt);
}
}
void usage()
{
cout << "Open Babel " << BABEL_VERSION << " -- " << __DATE__ << " -- "
<< __TIME__ << endl;
cout << "Usage: " << program_name
<< " [-i<input-type>] <name> [-o<output-type>] <name>" << endl;
cout << "Try -H option for more information." << endl;
#ifdef _DEBUG
//CM keep window open
cout << "Press any key to finish" <<endl;
getch();
#endif
exit (0);
}
void help()
{
cout << "Open Babel converts chemical structures from one file format to another"<< endl << endl;
cout << "Usage: " << program_name << " <input spec> <output spec> [Options]" << endl << endl;
cout << "Each spec can be a file whose extension decides the format." << endl;
cout << "Optionally the format can be specified by preceding the file by" << endl;
cout << "-i<format-type> e.g. -icml, for input and -o<format-type> for output" << endl << endl;
cout << "See below for available format-types, which are the same as the " << endl;
cout << "file extensions and are case independent." << endl;
cout << "If no input or output file is given stdin or stdout are used instead." << endl << endl;
cout << "More than one input file can be specified and their names can contain" <<endl;
cout << "wildcard chars (* and ?).The molecules are aggregated in the output file.\n" << endl;
cout << OBConversion::Description(); // Conversion options
cout << "-H Outputs this help text" << endl;
cout << "-Hxxx (xxx is file format ID e.g. -Hcml) gives format info" <<endl;
cout << "-Hall Outputs details of all formats" <<endl;
cout << "-V Outputs version number" <<endl;
cout << "-L <BaseType> Lists plugin classes of this type" << endl;
cout << " e.g. <fingerprints>, or <plugins> for a list of BaseTypes" << endl;
cout << "-m Produces multiple output files, to allow:" <<endl;
cout << " Splitting: e.g. " << program_name << " infile.mol new.smi -m" <<endl;
cout << " puts each molecule into new1.smi new2.smi etc" <<endl;
cout << " Batch conversion: e.g. " << program_name << " *.mol -osmi -m" <<endl;
cout << " converts each input file to a .smi file" << endl;
#ifdef _WIN32
cout << " In Windows these can also be done using the forms" <<endl;
cout << " " << program_name << " infile.mol new*.smi and " << program_name << " *.mol *.smi respectively.\n" <<endl;
#endif
OBFormat* pDefault = OBConversion::GetDefaultFormat();
if(pDefault)
cout << pDefault->TargetClassDescription();// some more options probably for OBMol
OBFormat* pAPI= OBConversion::FindFormat("obapi");
if(pAPI)
cout << pAPI->Description();
cout << "The following file formats are recognized:" << endl;
OBPlugin::List("formats");
cout << "\nSee further specific info and options using -H<format-type>, e.g. -Hcml" << endl;
}
/* OpenBabel man page*/
/** \page babel a converter for chemistry and molecular modeling data files
*
* \n
* \par SYNOPSIS
*
* \b babel [-H<help-options>] [-V] [-m] [-d] [-h] [-p] [-s<SMARTS-pattern>] [-v<SMARTS-pattern>] [-f<#> -l<#>] [-c] [-x<format-options>] [-i<input-type>] \<infile\> [-o<output-type>] \<outfile\>
*
* \par DESCRIPTION
*
* Open Babel is a program designed to interconvert a number of
* file formats currently used in molecular modeling software. \n\n
*
* Note that Open Babel can also be used as a library to interconvert
* many file formats and to provide standard chemistry software routines.
* See the Open Babel web pages (http://openbabel.sourceforge.net) for more
* information.
*
* \par OPTIONS
*
* If only input and ouput files are given, Open Babel will guess
* the file type from the filename extension. \n\n
*
* \b -V :
* Output version number and exit \n\n
* \b -H :
* Output usage information \n\n
* \b -H\<format-ID\> :
* Output formatting information and options for format specified\n\n
* \b -Hall :
* Output formatting information and options for all formats\n\n
* \b -i :
* Specifies input format, see below for the available formats \n\n
* \b -o :
* Specifies output format, see below for the available formats \n\n
* \b -m :
* Produce multiple output files, to allow:\n
* * Splitting one input file - put each molecule into consecutively numbered output files \n
* * Batch conversion - convert each of multiple input files into a specified output format \n
* See examples below \n\n
* \b -d :
* Delete Hydrogens \n\n
* \b -h :
* Add Hydrogens \n\n
* \b -p :
* Add Hydrogens appropriate for pH (use transforms in phmodel.txt) \n\n
* \b -t :
* All input files describe a single molecule \n\n
* \b -f\<#\> :
* For multiple entries input, start import at molecule # \n\n
* \b -l\<#\> :
* For multiple entries input, stop import at molecule # \n\n
* \b -c :
* Center atomic coordinates at (0,0,0) \n\n
* \b -s\<SMARTS\> :
* Convert only molecules matching the SMARTS pattern specified \n\n
* \b -v\<SMARTS\> :
* Convert only molecules \b NOT matching SMARTS pattern specified \n\n
*
* \par FILE FORMATS
*
* The following formats are currently supported by Open Babel:
* \n alc -- Alchemy format
* \n bgf -- BGF format
* \n box -- Dock 3.5 Box format
* \n bs -- Ball and Stick format
* \n c3d1 -- Chem3D Cartesian 1 format
* \n c3d2 -- Chem3D Cartesian2 format
* \n caccrt -- Cacao format
* \n cache -- CAChe format [Writeonly]
* \n cacint -- CacaoInternal format [Writeonly]
* \n car -- MSI Biosym/Insight II CAR format [Readonly]
* \n ccc -- CCC format [Readonly]
* \n cht -- ChemTool format [Writeonly]
* \n cml -- Chemical Markup Language
* \n crk2d -- Chemical Resource Kit diagram format (2D)
* \n crk3d -- Chemical Resource Kit 3D format
* \n csr -- CSR format [Writeonly]
* \n cssr -- CSD CSSR format [Writeonly]
* \n ct -- ChemDraw Connection Table format
* \n dmol -- DMol3 coordinates format
* \n ent -- Protein Data Bank format
* \n feat -- Feature format
* \n fh -- Fenske-Hall Z-Matrix format [Writeonly]
* \n fix -- FIX format [Writeonly]
* \n g03 -- Gaussian98/03 Cartesian [Writeonly]
* \n g98 -- Gaussian98/03 Cartesian [Writeonly]
* \n gam -- GAMESS Output
* \n gamout -- GAMESS Output
* \n gau -- Gaussian98/03 Cartesian [Writeonly]
* \n gpr -- Ghemical format
* \n gr96 -- GROMOS96 format [Writeonly]
* \n hin -- HyperChem Input format
* \n ins -- ShelX format [Readonly]
* \n jout -- Jaguar output format
* \n mdl -- MDL MOL format
* \n mm1gp -- Ghemical format
* \n mm3 -- MM3 format [Writeonly]
* \n mmd -- MacroMod format
* \n mmod -- MacroMod format
* \n mol -- MDL MOL format
* \n mol2 -- Sybyl Mol2 format
* \n mopcrt -- MOPAC Cartesian format
* \n mopout -- MOPAC Output format [Readonly]
* \n mpqc -- MPQC format [Readonly]
* \n nwo -- NWChem format
* \n pdb -- Protein Data Bank format
* \n pov -- POV-Ray input format [Writeonly]
* \n pqs -- Parallel Quantum Solutions format
* \n prep -- Amber Prep format [Readonly]
* \n qcout -- QChem output format
* \n qm1gp -- Ghemical format
* \n report -- Report format [Writeonly]
* \n res -- ShelX format [Readonly]
* \n rxn -- MDL RXN format
* \n sd -- MDL MOL format
* \n sdf -- MDL MOL format
* \n smi -- SMILES format
* \n tmol -- TurboMole Coordinate format
* \n txyz -- Tinker format [Writeonly]
* \n unixyz -- UniChem XYZ format
* \n vmol -- ViewMol format
* \n xed -- XED format [Writeonly]
* \n xyz -- XYZ cartesian coordinates format
* \n zin -- ZINDO input format [Writeonly]
*
* \par FORMAT OPTIONS
* Individual file formats may have additional formatting options. \n
* Input format options are preceded by 'a', e.g. -as \n
* Output format options are preceded by 'x', e.g. -xn \n
* For further specific information and options, use -H<format-type> \n
* e.g., -Hcml
*
* \par EXAMPLES
* - Standard conversion \n
* babel -ixyz ethanol.xyz -opdb ethanol.pdb \n
* - Conversion from a SMI file in STDIN to a Mol2 file written to STDOUT \n
* babel -ismi -omol2 \n
* - Split a multi-molecule file into new1.smi, new2.smi, etc. \n
* babel infile.mol new.smi -m \n
*
* \par AUTHORS
*
* Open Babel is currently maintained by \b Geoff \b Hutchison, \b Chris \b Morley and \b Michael \b Banck.
*
* For more contributors to Open Babel, see http://openbabel.sourceforge.net/THANKS.shtml
*
* \par COPYRIGHT
* Copyright (C) 1998-2001 by OpenEye Scientific Software, Inc.
* Some portions Copyright (C) 2001-2005 by Geoffrey R. Hutchison \n \n
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation version 2 of the License.\n \n
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* \par SEE ALSO
* The web pages for Open Babel can be found at http://openbabel.sourceforge.net/
**/
|