Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Typo fixes #1

Open
wants to merge 1 commit into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion bio_clip/data/downstream/pesto_src/structure.py
Original file line number Diff line number Diff line change
Expand Up @@ -44,7 +44,7 @@ def clean_structure(structure):
)[1]
delta_chains = np.abs(np.sign(np.concatenate([[0], np.diff(ids_chains)])))

# find changes due to inertion code
# find changes due to insertion code
icodes = structure["icode"]
ids_icodes = np.where(
np.array(icodes).reshape(-1, 1) == np.unique(icodes).reshape(1, -1)
Expand Down
2 changes: 1 addition & 1 deletion bio_clip/data/downstream/ppi.py
Original file line number Diff line number Diff line change
Expand Up @@ -122,7 +122,7 @@ def cropping_dependent_processing(
):
"""This task is now deprecated as there were problems found in the original paper.
Additionally, this task was previously pre-processed using an old version of the
BioCLIP code which we do not provide. Data-transform dependend pre-processing takes
BioCLIP code which we do not provide. Data-transform dependent pre-processing takes
quite long, thus it is processed in parallel, cached, then training is performed.

Args:
Expand Down
2 changes: 1 addition & 1 deletion bio_clip/model/gnn.py
Original file line number Diff line number Diff line change
Expand Up @@ -23,7 +23,7 @@


class PositionalEncodingLayer(hk.Module):
"""Independent-Equivariant Graph Matching Newtork"""
"""Independent-Equivariant Graph Matching Network"""

def __init__(self, positional_encoding_dimension: int):
"""Initializes a Positional Encoding Layer
Expand Down
2 changes: 1 addition & 1 deletion bio_clip/train/data_transforms.py
Original file line number Diff line number Diff line change
Expand Up @@ -480,7 +480,7 @@ def crop_pad(data, multiply_by):
atom14_mask.astype(np.float32),
)

# I am cropping tokens manually here, because the filter guarentees the num residues
# I am cropping tokens manually here, because the filter guarantees the num residues
# is below padding_num_residue
tokens = tokens[:padding_num_residue]

Expand Down
2 changes: 1 addition & 1 deletion bio_clip/train/pretrain/dataloader.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@ class BioClipDataloaderParams:
# files. The filepaths can be GCP bucket filepaths (in which case they should start
# with gs://)
batch_dims: Tuple[int, ...] # Batches of training samples will be reshaped to this
# shape before being outputed (the effective batch size is np.prod(batch_dims)).
# shape before being outputted (the effective batch size is np.prod(batch_dims)).
# This is useful for preparing the batches in a shape that matches what jax.pmap and
# jax.vmap expect.
shuffle: bool = True # If True, shuffle the filepaths at the beginning of all
Expand Down
2 changes: 1 addition & 1 deletion bio_clip/train/pretrain/trainer.py
Original file line number Diff line number Diff line change
Expand Up @@ -342,7 +342,7 @@ def predict(

Returns:
loss (float): Training Loss.
aux_metrics (dict): Auxillary metrics.
aux_metrics (dict): Auxiliary metrics.
"""
mean = (
jnp.mean
Expand Down
2 changes: 1 addition & 1 deletion bio_clip/utils/utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -132,7 +132,7 @@ def _background_thread(self) -> None:
def convert_to_ml_dict(dct: Union[DictConfig, Any]) -> Union[ConfigDict, Any]:
"""
This function converts the DictConfig returned by Hydra
into a ConfigDict. The recusion allows to convert
into a ConfigDict. The recursion allows to convert
all the nested DictConfig elements of the config. The recursion stops
once the reached element is not a DictConfig.
"""
Expand Down
2 changes: 1 addition & 1 deletion build-source/Dockerfile
Original file line number Diff line number Diff line change
Expand Up @@ -53,7 +53,7 @@ RUN ln -s /app/bio-clip/bio_clip /opt/conda/envs/bioclip/lib/python3.9/site-pack

# Disable debug, info, and warning tensorflow logs
ENV TF_CPP_MIN_LOG_LEVEL=3
# # By default use cpu as the backend for JAX, we will explicitely load data on gpus/tpus as needed.
# # By default use cpu as the backend for JAX, we will explicitly load data on gpus/tpus as needed.
# ENV JAX_PLATFORM_NAME="cpu"

# aws
Expand Down
4 changes: 2 additions & 2 deletions datasets/pretraining/create/data_processing.py
Original file line number Diff line number Diff line change
Expand Up @@ -586,7 +586,7 @@ def compute_graph_of_protein(
raw PDB data for the ligand sorted by residue
stacked_residue_coordinates (Coordinates):
list of residue coordinates for the ligand
num_neighbor (int, optional): number of nearest neigbors in the graph.
num_neighbor (int, optional): number of nearest neighbors in the graph.
Defaults to None.
residue_loc_is_alphac (bool, optional): whether the alpha-C atom
is used for residue center. Defaults to True.
Expand Down Expand Up @@ -828,7 +828,7 @@ def get_residues_db5(pdb_filename: str) -> List[SortedPdbData]:

Returns:
List of residues, each residue being represented by:
chain, residue, resname and all atom informations
chain, residue, resname and all atom information
"""
df = PandasPdb().read_pdb(pdb_filename)
df = df.df["ATOM"]
Expand Down