bpp-seq  2.2.0
Phylip.h
Go to the documentation of this file.
1 //
2 // File: Phylip.h
3 // Created by: Julien Dutheil
4 // Created on: Mon Oct 27 12:22:56 2003
5 //
6 
7 /*
8 Copyright or © or Copr. Bio++ Development Team, (November 17, 2004)
9 
10 This software is a computer program whose purpose is to provide classes
11 for sequences analysis.
12 
13 This software is governed by the CeCILL license under French law and
14 abiding by the rules of distribution of free software. You can use,
15 modify and/ or redistribute the software under the terms of the CeCILL
16 license as circulated by CEA, CNRS and INRIA at the following URL
17 "http://www.cecill.info".
18 
19 As a counterpart to the access to the source code and rights to copy,
20 modify and redistribute granted by the license, users are provided only
21 with a limited warranty and the software's author, the holder of the
22 economic rights, and the successive licensors have only limited
23 liability.
24 
25 In this respect, the user's attention is drawn to the risks associated
26 with loading, using, modifying and/or developing or reproducing the
27 software by the user in light of its specific status of free software,
28 that may mean that it is complicated to manipulate, and that also
29 therefore means that it is reserved for developers and experienced
30 professionals having in-depth computer knowledge. Users are therefore
31 encouraged to load and test the software's suitability as regards their
32 requirements in conditions enabling the security of their systems and/or
33 data to be ensured and, more generally, to use and operate it in the
34 same conditions as regards security.
35 
36 The fact that you are presently reading this means that you have had
37 knowledge of the CeCILL license and that you accept its terms.
38 */
39 
40 #ifndef _PHYLIP_H_
41 #define _PHYLIP_H_
42 
43 #include "AbstractIAlignment.h"
44 #include "AbstractOAlignment.h"
45 #include "../Sequence.h"
46 #include "../Container/SequenceContainer.h"
47 #include "../Container/VectorSequenceContainer.h"
48 #include "../Container/AlignedSequenceContainer.h"
49 
50 // From the STL:
51 #include <iostream>
52 
53 namespace bpp
54 {
55 
// The Phylip & co format: reader/writer for sequence alignments.
// Combines the AbstractIAlignment and AbstractOAlignment partial implementations
// and also exposes the ISequence interface (readSequences forwards to readAlignment).
// NOTE(review): the member functions use dynamic exception specifications
// (throw (Exception)), which were removed in C++17 -- confirm the targeted standard.
64 class Phylip :
65  public AbstractIAlignment,
66  public AbstractOAlignment,
67  public virtual ISequence
68 {
69  private:
70 
71  /* This class supports two kinds of Phylip format:
72  * 'traditional', with names limited to 10 chars,
73  * and 'extended', defined by PAML, with names separated from sequences by at least 6 white spaces.
74  */
75  bool extended_;
76  /* Tells whether sequences are in the sequential or the interleaved format.
77  */
 // NOTE(review): the member this comment describes (bool sequential_, Phylip.h:78
 // according to the cross-reference index after the listing) is not shown here,
 // although the constructor initializes it.
79 
 // The maximum number of chars to be written on a line.
83  unsigned int charsByLine_;
84 
 // NOTE(review): bool checkNames_ (Phylip.h:85 according to the cross-reference
 // index after the listing) is not shown here; it is set by the constructor and
 // read/written by the two checkNames() overloads.
86 
 // Value returned by getSplit() and replaced by setSplit().
 // Presumably the separator between a sequence name and its sequence -- TODO confirm in Phylip.cpp.
87  std::string namesSplit_;
88 
89  public:
 // Build a new Phylip file reader.
 //   extended           stored in extended_ (see the format comment above); default true.
 //   sequential         stored in sequential_; default true.
 //   charsByLine        stored in charsByLine_, the maximum number of chars written on a line; default 100.
 //   checkSequenceNames stored in checkNames_; default true.
 //   split              stored in namesSplit_; default " ".
99  Phylip(bool extended = true, bool sequential = true, unsigned int charsByLine = 100, bool checkSequenceNames = true, const std::string& split = " "):
100  extended_(extended), sequential_(sequential), charsByLine_(charsByLine), checkNames_(checkSequenceNames), namesSplit_(split) {}
101 
102  virtual ~Phylip() {}
103 
104  public:
105 
 // Append sequences to a container from a stream (defined in Phylip.cpp).
111  void appendAlignmentFromStream(std::istream& input, SiteContainer& sc) const throw (Exception);
 // Create a new container from a stream; simply forwards to readAlignment(input, alpha).
122  virtual SequenceContainer* readSequences(std::istream& input, const Alphabet* alpha) const throw (Exception) {
123  return readAlignment(input, alpha);
124  }
 // Create a new container from a file; simply forwards to readAlignment(path, alpha).
125  virtual SequenceContainer* readSequences(const std::string& path, const Alphabet* alpha) const throw (Exception) {
126  return readAlignment(path, alpha);
127  }
 // Defined in Phylip.cpp; declared to throw IOException.
136  unsigned int getNumberOfSequences(const std::string& path) const throw (IOException);
137 
 // Write a container to a stream (defined in Phylip.cpp).
143  void writeAlignment(std::ostream& output, const SiteContainer& sc) const throw (Exception);
 // Write a container to a file; delegates to AbstractOAlignment::writeAlignment(path, sc, overwrite).
144  void writeAlignment(const std::string& path, const SiteContainer& sc, bool overwrite) const throw (Exception)
145  {
146  AbstractOAlignment::writeAlignment(path, sc, overwrite);
147  }
 // Both defined in Phylip.cpp; each returns a std::string by value.
156  const std::string getFormatName() const;
157  const std::string getFormatDescription() const;
 // Returns the current value of checkNames_.
163  bool checkNames() const { return checkNames_; }
164 
 // Tell whether the sequence names should be checked when reading from files.
170  void checkNames(bool yn) { checkNames_ = yn; }
171 
 // Returns a reference to namesSplit_.
175  const std::string& getSplit() const { return namesSplit_; }
176 
 // Replaces namesSplit_ with the given string.
180  void setSplit(const std::string& split) { namesSplit_ = split; }
181 
182  protected:
183  // Reading tools (all defined in Phylip.cpp):
184  const std::vector<std::string> splitNameAndSequence(const std::string& s) const throw (Exception);
185  void readSequential (std::istream& in, SiteContainer& asc) const throw (Exception);
186  void readInterleaved(std::istream& in, SiteContainer& asc) const throw (Exception);
187  // Writing tools (all defined in Phylip.cpp):
188  std::vector<std::string> getSizedNames(const std::vector<std::string>& names) const;
189  void writeSequential(std::ostream& out, const SequenceContainer& sc) const;
190  void writeInterleaved(std::ostream& out, const SequenceContainer& sc) const;
191 };
192 
193 } //end of namespace bpp.
194 
195 #endif //_PHYLIP_H_
196 
const std::string & getSplit() const
Definition: Phylip.h:175
bool extended_
Definition: Phylip.h:75
void checkNames(bool yn)
Tell whether the sequence names should be checked when reading from files.
Definition: Phylip.h:170
virtual SequenceContainer * readSequences(const std::string &path, const Alphabet *alpha) const
Create a new container from a file.
Definition: Phylip.h:125
unsigned int charsByLine_
The maximum number of chars to be written on a line.
Definition: Phylip.h:83
void writeInterleaved(std::ostream &out, const SequenceContainer &sc) const
Definition: Phylip.cpp:246
void readSequential(std::istream &in, SiteContainer &asc) const
Definition: Phylip.cpp:75
The SiteContainer interface.
Definition: SiteContainer.h:63
const std::string getFormatDescription() const
Definition: Phylip.cpp:298
This alphabet is used to deal with NumericAlphabet.
std::vector< std::string > getSizedNames(const std::vector< std::string > &names) const
Definition: Phylip.cpp:201
void appendAlignmentFromStream(std::istream &input, SiteContainer &sc) const
Append sequences to a container from a stream.
Definition: Phylip.cpp:174
const std::string getFormatName() const
Definition: Phylip.cpp:294
bool checkNames_
Definition: Phylip.h:85
Partial implementation of the IAlignment interface, dedicated to alignment readers.
void readInterleaved(std::istream &in, SiteContainer &asc) const
Definition: Phylip.cpp:132
The Alphabet interface.
Definition: Alphabet.h:130
std::string namesSplit_
Definition: Phylip.h:87
bool sequential_
Definition: Phylip.h:78
void writeAlignment(const std::string &path, const SiteContainer &sc, bool overwrite) const
Write a container to a file.
Definition: Phylip.h:144
bool checkNames() const
Definition: Phylip.h:163
void writeAlignment(std::ostream &output, const SiteContainer &sc) const
Write a container to a stream.
Definition: Phylip.cpp:279
The Phylip & co format.
Definition: Phylip.h:64
Phylip(bool extended=true, bool sequential=true, unsigned int charsByLine=100, bool checkSequenceNames=true, const std::string &split=" ")
Build a new Phylip file reader.
Definition: Phylip.h:99
virtual SequenceContainer * readSequences(std::istream &input, const Alphabet *alpha) const
Create a new container from a stream.
Definition: Phylip.h:122
void writeSequential(std::ostream &out, const SequenceContainer &sc) const
Definition: Phylip.cpp:226
virtual ~Phylip()
Definition: Phylip.h:102
const std::vector< std::string > splitNameAndSequence(const std::string &s) const
Definition: Phylip.cpp:55
void setSplit(const std::string &split)
Definition: Phylip.h:180
unsigned int getNumberOfSequences(const std::string &path) const
Definition: Phylip.cpp:185
Partial implementation of the OAlignment interface.
The SequenceContainer interface.
virtual void readAlignment(std::istream &input, SiteContainer &sc) const
Add sequences to a container from a stream.
The ISequence interface.
Definition: ISequence.h:64
void writeAlignment(std::ostream &output, const SiteContainer &sc) const =0
Write a container to a stream.