BioPandas
diff --git a/‎.appveyor.yml‎
Lines changed: 23 additions & 0 deletions b/‎.appveyor.yml‎
Lines changed: 23 additions & 0 deletions
diff --git a/‎.github/PULL_REQUEST_TEMPLATE.md‎
Lines changed: 43 additions & 0 deletions b/‎.github/PULL_REQUEST_TEMPLATE.md‎
Lines changed: 43 additions & 0 deletions
diff --git a/‎README.md‎
Lines changed: 1 addition & 0 deletions b/‎README.md‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎biopandas/__init__.py‎
Lines changed: 1 addition & 1 deletion b/‎biopandas/__init__.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎biopandas/pdb/pandas_pdb.py‎
Lines changed: 63 additions & 9 deletions b/‎biopandas/pdb/pandas_pdb.py‎
Lines changed: 63 additions & 9 deletions
@@ -0,0 +1,23 @@
+build: false
+
+environment:
+  matrix:
+    - PYTHON_VERSION: 2.7
+      MINICONDA: C:\Miniconda
+    - PYTHON_VERSION: 3.5
+      MINICONDA: C:\Miniconda3
+
+init:
+  - ECHO %PYTHON_VERSION% %MINICONDA%
+  - ECHO conda --version
+
+install:
+  - set PATH=%MINICONDA%;%MINICONDA%\\Scripts;%PATH%
+  - conda config --set always_yes yes --set changeps1 no
+  - conda update -q conda
+  - conda info -a
+  - conda create -q -n test-environment python=%PYTHON_VERSION% numpy scipy pandas nose
+  - activate test-environment
+
+test_script:
+  - nosetests -s -v
@@ -0,0 +1,43 @@
+<!-- Please read the following guidelines for new Pull Requests -- thank you! -->
+
+<!--
+Make sure that you submit this pull request as a separate topic branch (and not to "master")
+-->
+
+<!-- Provide a small summary describing the Pull Request below -->
+
+### Description
+
+Insert Description Here
+
+### Related issues or pull requests
+
+<!-- Please provide a link to the respective issue on the [Issue Tracker](https://github.com/rasbt/biopandas/issues) if one exists. E.g.,
+
+Fixes #<ISSUE_NUMBER> -->
+
+Link related issues/pull requests here
+
+<!-- Below is a general todo list for typical pull request -->
+
+### Pull Request requirements
+
+- [ ] Added appropriate unit test functions in the `./biopandas/*/tests` directories
+- [ ] Ran `nosetests ./biopandas -sv` and made sure that all unit tests pass
+- [ ] Checked the test coverage by running `nosetests ./biopandas --with-coverage`
+- [ ] Checked for style issues by running `flake8 ./biopandas`
+- [ ] Added a note about the modification or contribution to the `./docs/sources/CHANGELOG.md` file
+- [ ] Modified documentation in the appropriate location under `biopandas/docs/sources/` (optional)
+- [ ] Checked that the Travis-CI build passed at https://travis-ci.org/rasbt/biopandas
+
+
+
+
+<!--
+NOTE
+
+Due to the improved GitHub UI, the squashing of commits is no longer necessary.
+Please DO NOT SQUASH commits since they help with keeping track of the changes during the discussion.
+
+For more information and instructions, please see http://rasbt.github.io/mlxtend/contributing/
+-->
@@ -4,6 +4,7 @@
 
 
 [![Continuous Integration](https://travis-ci.org/rasbt/biopandas.svg?branch=master)](https://travis-ci.org/rasbt/biopandas)
+[![Build status](https://ci.appveyor.com/api/projects/status/jcp91fvbgmqws30p/branch/master?svg=true)](https://ci.appveyor.com/project/rasbt/biopandas/branch/master)
 [![Code Coverage](https://coveralls.io/repos/rasbt/biopandas/badge.svg?branch=master&service=github)](https://coveralls.io/github/rasbt/biopandas?branch=master)
 [![Code Health](https://landscape.io/github/rasbt/biopandas/master/landscape.svg?style=flat)](https://landscape.io/github/rasbt/biopandas/master)
 [![PyPI Version](https://img.shields.io/pypi/v/biopandas.svg)](https://pypi.python.org/pypi/biopandas/)
 
@@ -4,5 +4,5 @@
 # Project Website: http://rasbt.github.io/biopandas/
 # Code Repository: https://github.com/rasbt/biopandas
 
-__version__ = '0.1.5.dev0'
+__version__ = '0.1.5'
 __author__ = "Sebastian Raschka <[email protected]>"
@@ -90,7 +90,7 @@ def get(self, s, df=None, invert=False):
 
         Parameters
         ----------
-        s : str  in {'main chain', 'hydrogen', 'c-alpha'}
+        s : str  in {'main chain', 'hydrogen', 'c-alpha', 'heavy', 'carbon'}
             String to specify which entries to return
 
         df : pandas.DataFrame, default: None
@@ -115,8 +115,41 @@ def get(self, s, df=None, invert=False):
             df = self._df['ATOM']
         return self._get_dict[s](df, invert=invert)
 
+    def impute_element(self, sections=('ATOM', 'HETATM'), inplace=False):
+        """Impute element_symbol from the atom_name column.
+
+        Parameters
+        ----------
+        sections : iterable (default: ('ATOM', 'HETATM'))
+            Coordinate sections for which the element symbols should be
+            imputed.
+
+        inplace : bool (default: False)
+            Modifies the section DataFrames of `self.df` directly if True and
+            works on copies of them otherwise.
+
+        Returns
+        -------
+        dict-like of section DataFrames (`self.df` itself if `inplace`)
+        """
+        if inplace:
+            t = self.df
+        else:
+            t = self.df.copy()
+            for d in self.df:
+                t[d] = self.df[d].copy()
+
+        for sec in sections:
+            # 2nd atom_name char if element_symbol has 3 chars, else the 1st
+            t[sec]['element_symbol'] = \
+                t[sec][['atom_name', 'element_symbol']].apply(
+                    lambda x: x['atom_name'][1]
+                    if len(x['element_symbol']) == 3
+                    else x['atom_name'][0], axis=1)
+        return t
+
     @staticmethod
-    def rmsd(df1, df2, s='main chain', invert=False):
+    def rmsd(df1, df2, s=None, invert=False):
         """Compute the Root Mean Square Deviation between molecules.
 
         Parameters
@@ -128,8 +161,10 @@ def rmsd(df1, df2, s='main chain', invert=False):
             Second DataFrame for RMSD computation against df1. Must have the
             same number of entries as df1
 
-        s : str in {'main chain', 'hydrogen', 'c-alpha'}, default: 'main chain'
-            String to specify which entries to consider.
+        s : {'main chain', 'hydrogen', 'c-alpha', 'heavy', 'carbon'} or None,
+            default: None
+            String to specify which entries to consider. If None, considers
+            all atoms for comparison.
 
         invert : bool, default: False
             Inverts the string query if true. For example, the setting
@@ -163,7 +198,9 @@ def _init_get_dict():
         """Initialize dictionary for filter operations."""
         get_dict = {'main chain': PandasPDB._get_mainchain,
                     'hydrogen': PandasPDB._get_hydrogen,
-                    'c-alpha': PandasPDB._get_calpha}
+                    'c-alpha': PandasPDB._get_calpha,
+                    'carbon': PandasPDB._get_carbon,
+                    'heavy': PandasPDB._get_heavy}
         return get_dict
 
     @staticmethod
@@ -234,9 +271,17 @@ def _get_mainchain(df, invert):
     def _get_hydrogen(df, invert):
         """Return only hydrogen atom entries from a DataFrame"""
         if invert:
-            return df[(df['atom_name'] != 'H')]
+            return df[(df['element_symbol'] != 'H')]
+        else:
+            return df[(df['element_symbol'] == 'H')]
+
+    @staticmethod
+    def _get_heavy(df, invert):
+        """Return only heavy atom entries from a DataFrame"""
+        if invert:
+            return df[df['element_symbol'] == 'H']
         else:
-            return df[(df['atom_name'] == 'H')]
+            return df[df['element_symbol'] != 'H']
 
     @staticmethod
     def _get_calpha(df, invert):
@@ -246,6 +291,14 @@ def _get_calpha(df, invert):
         else:
             return df[df['atom_name'] == 'CA']
 
+    @staticmethod
+    def _get_carbon(df, invert):
+        """Return carbon atom entries (non-carbon ones if `invert`)"""
+        if invert:
+            return df[df['element_symbol'] != 'C']
+        else:
+            return df[df['element_symbol'] == 'C']
+
     @staticmethod
     def _construct_df(pdb_lines):
         """Construct DataFrames from list of PDB lines."""
@@ -256,7 +309,8 @@ def _construct_df(pdb_lines):
             if line.strip():
                 if line.startswith(valids):
                     record = line[:6].rstrip()
-                    line_ele = ['' for _ in range(len(pdb_records[record])+1)]
+                    line_ele = ['' for _ in range(len(
+                        pdb_records[record]) + 1)]
                     for idx, ele in enumerate(pdb_records[record]):
                         line_ele[idx] = (line[ele['line'][0]:ele['line'][1]]
                                          .strip())
@@ -269,7 +323,7 @@ def _construct_df(pdb_lines):
         dfs = {}
         for r in line_lists.items():
             df = pd.DataFrame(r[1], columns=[c['id'] for c in
-                                             pdb_records[r[0]]]+['line_idx'])
+                                             pdb_records[r[0]]] + ['line_idx'])
             for c in pdb_records[r[0]]:
                 try:
                     df[c['id']] = df[c['id']].astype(c['type'])