bioinf-jku
diff --git a/‎.github/workflows/test_dev.yml
+40 b/‎.github/workflows/test_dev.yml
+40
diff --git a/‎.github/workflows/test_master.yml
+40 b/‎.github/workflows/test_master.yml
+40
diff --git a/‎README.md
+13-1 b/‎README.md
+13-1
diff --git a/‎example.ipynb
+61-24 b/‎example.ipynb
+61-24
diff --git a/‎fcd/__init__.py
+13-3 b/‎fcd/__init__.py
+13-3
@@ -0,0 +1,40 @@
+# Runs flake8 and pytest on Python 3.8-3.12 for every push to, and pull request targeting, the "dev" branch.
+# For more information see: https://docs.github.com/en/actions/automating-builds-and-tests/building-and-testing-python
+
+name: Tests (dev)
+
+on:
+  push:
+    branches: [ "dev" ]
+  pull_request:
+    branches: [ "dev" ]  # filters on the pull request's base (target) branch
+
+jobs:
+  build:
+
+    runs-on: ubuntu-latest
+    strategy:
+      fail-fast: false  # let the other matrix jobs finish even if one Python version fails
+      matrix:
+        python-version: ["3.8", "3.9", "3.10", "3.11", "3.12"]  # quoted so "3.10" is not read as the float 3.1
+
+    steps:
+    - uses: actions/checkout@v4
+    - name: Set up Python ${{ matrix.python-version }}
+      uses: actions/setup-python@v5
+      with:
+        python-version: ${{ matrix.python-version }}
+    - name: Install dependencies  # test tooling plus an editable install of this package
+      run: |
+        python -m pip install --upgrade pip
+        python -m pip install flake8 pytest
+        python -m pip install -e .
+    - name: Lint with flake8  # first pass fails the job; second pass (--exit-zero) only reports
+      run: |
+        # stop the build if there are Python syntax errors or undefined names
+        flake8 . --count --select=E9,F63,F7,F82 --show-source --statistics
+        # exit-zero treats all errors as warnings. The GitHub editor is 127 chars wide
+        flake8 . --count --exit-zero --max-complexity=10 --max-line-length=127 --statistics
+    - name: Test with pytest
+      run: |
+        pytest
@@ -0,0 +1,40 @@
+# Runs flake8 and pytest on Python 3.8-3.12 for every push to, and pull request targeting, the "master" branch.
+# For more information see: https://docs.github.com/en/actions/automating-builds-and-tests/building-and-testing-python
+
+name: Tests (master)
+
+on:
+  push:
+    branches: [ "master"]
+  pull_request:
+    branches: [ "master"]  # filters on the pull request's base (target) branch
+
+jobs:
+  build:
+
+    runs-on: ubuntu-latest
+    strategy:
+      fail-fast: false  # let the other matrix jobs finish even if one Python version fails
+      matrix:
+        python-version: ["3.8", "3.9", "3.10", "3.11", "3.12"]  # quoted so "3.10" is not read as the float 3.1
+
+    steps:
+    - uses: actions/checkout@v4
+    - name: Set up Python ${{ matrix.python-version }}
+      uses: actions/setup-python@v5
+      with:
+        python-version: ${{ matrix.python-version }}
+    - name: Install dependencies  # test tooling plus an editable install of this package
+      run: |
+        python -m pip install --upgrade pip
+        python -m pip install flake8 pytest
+        python -m pip install -e .
+    - name: Lint with flake8  # first pass fails the job; second pass (--exit-zero) only reports
+      run: |
+        # stop the build if there are Python syntax errors or undefined names
+        flake8 . --count --select=E9,F63,F7,F82 --show-source --statistics
+        # exit-zero treats all errors as warnings. The GitHub editor is 127 chars wide
+        flake8 . --count --exit-zero --max-complexity=10 --max-line-length=127 --statistics
+    - name: Test with pytest
+      run: |
+        pytest
@@ -1,15 +1,27 @@
 # Fréchet ChemNet Distance
+![PyPI](https://img.shields.io/pypi/v/fcd)
+![Tests (master)](https://github.com/bioinf-jku/fcd/actions/workflows/test_master.yml/badge.svg?branch=master)
+![Tests (dev)](https://github.com/bioinf-jku/fcd/actions/workflows/test_dev.yml/badge.svg?branch=dev)
+![PyPI - Downloads](https://img.shields.io/pypi/dm/fcd)
+![GitHub release (latest by date)](https://img.shields.io/github/v/release/bioinf-jku/fcd)
+![GitHub release date](https://img.shields.io/github/release-date/bioinf-jku/fcd)
+![GitHub](https://img.shields.io/github/license/bioinf-jku/fcd)
+
 
 Code for the paper "Fréchet ChemNet Distance: A Metric for Generative Models for Molecules in Drug Discovery"
 [JCIM](https://pubs.acs.org/doi/10.1021/acs.jcim.8b00234) /
 [ArXiv](https://arxiv.org/abs/1803.09518)
 
 
 ## Installation
-You can install the FCD using
+You can install FCD using
 ```
 pip install fcd
 ```
+or run the example notebook on Google Colab <a href="https://colab.research.google.com/github/bioinf-jku/FCD/blob/master/example.ipynb">
+   <img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab">
+</a>.
+
 
 # Requirements
 ```
 
@@ -2,20 +2,58 @@
  "cells": [
   {
    "cell_type": "code",
-   "execution_count": 1,
+   "execution_count": 22,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "%%capture\n",
+    "!pip install fcd"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 23,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "--2024-04-01 18:53:15--  https://raw.githubusercontent.com/bioinf-jku/FCD/master/generated_smiles/LSTM_Segler.smi\n",
+      "Resolving raw.githubusercontent.com (raw.githubusercontent.com)... 185.199.109.133, 185.199.108.133, 185.199.111.133, ...\n",
+      "Connecting to raw.githubusercontent.com (raw.githubusercontent.com)|185.199.109.133|:443... connected.\n",
+      "HTTP request sent, awaiting response... 200 OK\n",
+      "Length: 22730454 (22M) [text/plain]\n",
+      "Saving to: ‘generated_smiles/LSTM_Segler.smi’\n",
+      "\n",
+      "generated_smiles/LS 100%[===================>]  21.68M  3.07MB/s    in 7.3s    \n",
+      "\n",
+      "2024-04-01 18:53:22 (2.98 MB/s) - ‘generated_smiles/LSTM_Segler.smi’ saved [22730454/22730454]\n",
+      "\n"
+     ]
+    }
+   ],
+   "source": [
+    "!mkdir generated_smiles -p\n",
+    "!wget https://raw.githubusercontent.com/bioinf-jku/FCD/master/generated_smiles/LSTM_Segler.smi -O generated_smiles/LSTM_Segler.smi"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 24,
    "metadata": {},
    "outputs": [],
    "source": [
     "import os\n",
-    "from rdkit import RDLogger                                                                                                                                                               \n",
+    "from rdkit import RDLogger\n",
     "import numpy as np\n",
-    "import pandas as pd\n",
-    "from fcd import get_fcd, load_ref_model,canonical_smiles, get_predictions, calculate_frechet_distance\n",
     "\n",
-    "RDLogger.DisableLog('rdApp.*')\n",
+    "from fcd import get_fcd, load_ref_model, canonical_smiles, get_predictions, calculate_frechet_distance\n",
+    "\n",
+    "RDLogger.DisableLog(\"rdApp.*\")\n",
     "\n",
     "np.random.seed(0)\n",
-    "os.environ[\"CUDA_VISIBLE_DEVICES\"]= '0' #set gpu"
+    "os.environ[\"CUDA_VISIBLE_DEVICES\"] = \"0\"  # set gpu"
    ]
   },
   {
@@ -31,7 +69,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 2,
+   "execution_count": 25,
    "metadata": {
     "ExecuteTime": {
      "end_time": "2020-04-23T09:13:50.403933Z",
@@ -44,8 +82,11 @@
     "model = load_ref_model()\n",
     "\n",
     "# Load generated molecules\n",
-    "gen_mol_file = \"generated_smiles/LSTM_Segler.smi\" #input file which contains one generated SMILES per line\n",
-    "gen_mol = pd.read_csv(gen_mol_file,header=None)[0] #IMPORTANT: take at least 10000 molecules as FCD can vary with sample size \n",
+    "gen_mol_file = \"generated_smiles/LSTM_Segler.smi\"  # input file which contains one generated SMILES per line\n",
+    "with open(gen_mol_file) as f:\n",
+    "    gen_mol = [line.strip() for line in f if line.strip()]  # one SMILES per line; skip blank lines such as the one after a trailing newline\n",
+    "\n",
+    "# IMPORTANT: take at least 10000 molecules as FCD can vary with sample size\n",
     "sample1 = np.random.choice(gen_mol, 10000, replace=False)\n",
     "sample2 = np.random.choice(gen_mol, 10000, replace=False)\n",
     "\n",
@@ -65,7 +106,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 3,
+   "execution_count": 26,
    "metadata": {
     "ExecuteTime": {
      "end_time": "2020-04-23T09:11:27.207953Z",
@@ -77,12 +118,12 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "FCD:  0.333862289051325\n"
+      "FCD:  0.3298386855756661\n"
      ]
     }
    ],
    "source": [
-    "#get CHEBMLNET activations of generated molecules \n",
+    "# get ChemNet activations of generated molecules\n",
     "act1 = get_predictions(model, can_sample1)\n",
     "act2 = get_predictions(model, can_sample2)\n",
     "\n",
@@ -92,18 +133,14 @@
     "mu2 = np.mean(act2, axis=0)\n",
     "sigma2 = np.cov(act2.T)\n",
     "\n",
-    "fcd_score = calculate_frechet_distance(\n",
-    "    mu1=mu1,\n",
-    "    mu2=mu2, \n",
-    "    sigma1=sigma1,\n",
-    "    sigma2=sigma2)\n",
+    "fcd_score = calculate_frechet_distance(mu1=mu1, mu2=mu2, sigma1=sigma1, sigma2=sigma2)\n",
     "\n",
-    "print('FCD: ',fcd_score)"
+    "print(\"FCD: \", fcd_score)"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 4,
+   "execution_count": 27,
    "metadata": {
     "ExecuteTime": {
      "end_time": "2020-04-23T09:11:38.873496Z",
@@ -115,20 +152,20 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "FCD:  0.333862289051325\n"
+      "FCD:  0.3298386855756661\n"
      ]
     }
    ],
    "source": [
     "\"\"\"if you don't need to store the activations you can also take a shortcut.\"\"\"\n",
     "fcd_score = get_fcd(can_sample1, can_sample2, model)\n",
     "\n",
-    "print('FCD: ',fcd_score)"
+    "print(\"FCD: \", fcd_score)"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 5,
+   "execution_count": 28,
    "metadata": {
     "ExecuteTime": {
      "end_time": "2020-04-23T09:11:49.760022Z",
@@ -140,14 +177,14 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "FCD:  25.635578193222216\n"
+      "FCD:  25.552174526889033\n"
      ]
     }
    ],
    "source": [
     "\"\"\"This is what happens if you do not canonicalize the smiles\"\"\"\n",
     "fcd_score = get_fcd(can_sample1, sample2, model)\n",
-    "print('FCD: ',fcd_score)"
+    "print(\"FCD: \", fcd_score)"
    ]
   }
  ],
 
@@ -1,4 +1,14 @@
-from .fcd import get_fcd, get_predictions, load_ref_model
-from .utils import calculate_frechet_distance, canonical_smiles
+# ruff: noqa: F401
 
-__version__ = "1.2"
+from fcd.fcd import get_fcd, get_predictions, load_ref_model
+from fcd.utils import calculate_frechet_distance, canonical_smiles
+
+__all__ = [  # the names imported above from fcd.fcd and fcd.utils, re-exported as the package's public API
+    "get_fcd",
+    "get_predictions",
+    "load_ref_model",
+    "calculate_frechet_distance",
+    "canonical_smiles",
+]
+
+__version__ = "1.2.2"