|
2 | 2 | "cells": [ |
3 | 3 | { |
4 | 4 | "cell_type": "code", |
5 | | - "execution_count": 3, |
| 5 | + "execution_count": 1, |
6 | 6 | "metadata": {}, |
7 | | - "outputs": [], |
| 7 | + "outputs": [ |
| 8 | + { |
| 9 | + "name": "stderr", |
| 10 | + "output_type": "stream", |
| 11 | + "text": [ |
| 12 | + "2024-06-06 10:26:46.074236: I tensorflow/core/platform/cpu_feature_guard.cc:210] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n", |
| 13 | + "To enable the following instructions: AVX2 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n", |
| 14 | + "2024-06-06 10:26:46.608196: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n" |
| 15 | + ] |
| 16 | + } |
| 17 | + ], |
8 | 18 | "source": [ |
9 | 19 | "import numpy as np\n", |
10 | 20 | "import tensorflow as tf\n", |
|
21 | 31 | }, |
22 | 32 | { |
23 | 33 | "cell_type": "code", |
24 | | - "execution_count": 18, |
| 34 | + "execution_count": 5, |
25 | 35 | "metadata": {}, |
26 | 36 | "outputs": [], |
27 | 37 | "source": [ |
28 | 38 | "# Folder path\n", |
29 | | - "DATASET_DIR = './datasets/zinc-preprocess/'\n", |
| 39 | + "DATASET_DIR = './datasets/'\n", |
30 | 40 | "MAPPING_DIR = './mapping/'\n", |
31 | 41 | "\n", |
32 | 42 | "# SMILES path\n", |
|
40 | 50 | }, |
41 | 51 | { |
42 | 52 | "cell_type": "code", |
43 | | - "execution_count": 19, |
| 53 | + "execution_count": 6, |
44 | 54 | "metadata": {}, |
45 | 55 | "outputs": [ |
46 | 56 | { |
|
66 | 76 | }, |
67 | 77 | { |
68 | 78 | "cell_type": "code", |
69 | | - "execution_count": 4, |
| 79 | + "execution_count": 7, |
70 | 80 | "metadata": {}, |
71 | 81 | "outputs": [ |
72 | 82 | { |
73 | 83 | "name": "stderr", |
74 | 84 | "output_type": "stream", |
75 | 85 | "text": [ |
76 | | - "100%|██████████| 319616985/319616985 [5:27:12<00:00, 16279.95it/s] " |
| 86 | + "100%|██████████| 2/2 [00:00<00:00, 31655.12it/s]" |
77 | 87 | ] |
78 | 88 | }, |
79 | 89 | { |
80 | 90 | "name": "stdout", |
81 | 91 | "output_type": "stream", |
82 | 92 | "text": [ |
83 | | - "Total number of SMILES: 39\n" |
| 93 | + "Total number of SMILES: 2\n" |
84 | 94 | ] |
85 | 95 | }, |
86 | 96 | { |
|
108 | 118 | }, |
109 | 119 | { |
110 | 120 | "cell_type": "code", |
111 | | - "execution_count": 6, |
| 121 | + "execution_count": 8, |
112 | 122 | "metadata": {}, |
113 | 123 | "outputs": [ |
114 | 124 | { |
115 | 125 | "data": { |
116 | 126 | "text/plain": [ |
117 | | - "{'C': 1,\n", |
118 | | - " '@': 2,\n", |
119 | | - " '[': 3,\n", |
120 | | - " ']': 4,\n", |
121 | | - " 'H': 5,\n", |
122 | | - " '1': 6,\n", |
123 | | - " '2': 7,\n", |
124 | | - " 'O': 8,\n", |
125 | | - " '(': 9,\n", |
126 | | - " ')': 10,\n", |
127 | | - " 'N': 11,\n", |
128 | | - " '=': 12,\n", |
129 | | - " '3': 13,\n", |
130 | | - " 'l': 14,\n", |
131 | | - " 'S': 15,\n", |
132 | | - " '#': 16,\n", |
133 | | - " 'B': 17,\n", |
134 | | - " 'r': 18,\n", |
135 | | - " 'F': 19,\n", |
136 | | - " '4': 20,\n", |
137 | | - " '/': 21,\n", |
138 | | - " 'c': 22,\n", |
139 | | - " '+': 23,\n", |
140 | | - " '\\\\': 24,\n", |
141 | | - " 'P': 25,\n", |
142 | | - " '-': 26,\n", |
143 | | - " 'I': 27,\n", |
144 | | - " 'n': 28,\n", |
145 | | - " 'o': 29,\n", |
146 | | - " '<START>': 30,\n", |
147 | | - " '<PAD>': 31,\n", |
148 | | - " '<EOL>': 32}" |
| 127 | + "{'C': 1, 'c': 2, '<START>': 3, '<PAD>': 4, '<EOL>': 5}" |
149 | 128 | ] |
150 | 129 | }, |
151 | | - "execution_count": 6, |
| 130 | + "execution_count": 8, |
152 | 131 | "metadata": {}, |
153 | 132 | "output_type": "execute_result" |
154 | 133 | } |
|
165 | 144 | }, |
166 | 145 | { |
167 | 146 | "cell_type": "code", |
168 | | - "execution_count": 8, |
| 147 | + "execution_count": 9, |
169 | 148 | "metadata": {}, |
170 | 149 | "outputs": [ |
171 | 150 | { |
172 | 151 | "data": { |
173 | 152 | "text/plain": [ |
174 | | - "{1: 'C',\n", |
175 | | - " 2: '@',\n", |
176 | | - " 3: '[',\n", |
177 | | - " 4: ']',\n", |
178 | | - " 5: 'H',\n", |
179 | | - " 6: '1',\n", |
180 | | - " 7: '2',\n", |
181 | | - " 8: 'O',\n", |
182 | | - " 9: '(',\n", |
183 | | - " 10: ')',\n", |
184 | | - " 11: 'N',\n", |
185 | | - " 12: '=',\n", |
186 | | - " 13: '3',\n", |
187 | | - " 14: 'l',\n", |
188 | | - " 15: 'S',\n", |
189 | | - " 16: '#',\n", |
190 | | - " 17: 'B',\n", |
191 | | - " 18: 'r',\n", |
192 | | - " 19: 'F',\n", |
193 | | - " 20: '4',\n", |
194 | | - " 21: '/',\n", |
195 | | - " 22: 'c',\n", |
196 | | - " 23: '+',\n", |
197 | | - " 24: '\\\\',\n", |
198 | | - " 25: 'P',\n", |
199 | | - " 26: '-',\n", |
200 | | - " 27: 'I',\n", |
201 | | - " 28: 'n',\n", |
202 | | - " 29: 'o',\n", |
203 | | - " 30: '<START>',\n", |
204 | | - " 31: '<PAD>',\n", |
205 | | - " 32: '<EOL>'}" |
| 153 | + "{1: 'C', 2: 'c', 3: '<START>', 4: '<PAD>', 5: '<EOL>'}" |
206 | 154 | ] |
207 | 155 | }, |
208 | | - "execution_count": 8, |
| 156 | + "execution_count": 9, |
209 | 157 | "metadata": {}, |
210 | 158 | "output_type": "execute_result" |
211 | 159 | } |
|
218 | 166 | }, |
219 | 167 | { |
220 | 168 | "cell_type": "code", |
221 | | - "execution_count": 9, |
| 169 | + "execution_count": 10, |
222 | 170 | "metadata": {}, |
223 | 171 | "outputs": [], |
224 | 172 | "source": [ |
|
252 | 200 | "name": "python", |
253 | 201 | "nbconvert_exporter": "python", |
254 | 202 | "pygments_lexer": "ipython3", |
255 | | - "version": "3.6.9" |
| 203 | + "version": "3.10.14" |
256 | 204 | } |
257 | 205 | }, |
258 | 206 | "nbformat": 4, |
|
0 commit comments