Spaces:

vignt97867896
/

bioflow

Sleeping

App Files Files Community

bioflow / open_biomed /models /functional_model.py

Rami-Troudi

Phase 1: FastAPI integration with DeepPurpose DTI predictor

adecc9b 5 months ago

Raw

History Blame

3.85 kB

	from abc import ABC, abstractmethod
	from typing import Any, Dict, List, Optional, Tuple, Union
	from enum import Enum, auto

	import torch

	from open_biomed.data import Molecule, Protein, Text
	from open_biomed.models.base_model import BaseModel
	from open_biomed.utils.collator import Collator
	from open_biomed.utils.config import Config
	from open_biomed.utils.featurizer import MoleculeFeaturizer, ProteinFeaturizer, TextFeaturizer, Featurized

	class MoleculeModel(BaseModel):
	def __init__(self, model_cfg: Config) -> None:
	super(MoleculeModel, self).__init__(model_cfg)

	@abstractmethod
	def get_molecule_processor(self) -> Tuple[MoleculeFeaturizer, Collator]:
	raise NotImplementedError

	class MoleculeEncoder(MoleculeModel):
	def __init__(self, model_cfg: Config) -> None:
	super(MoleculeEncoder, self).__init__(model_cfg)

	@abstractmethod
	def encode_loss(self, label: Featurized[Molecule], **kwargs) -> Dict[str, torch.Tensor]:
	raise NotImplementedError

	@abstractmethod
	def encode_molecule(self, molecule: Union[List[Molecule], Any]) -> torch.Tensor:
	raise NotImplementedError

	class MoleculeDecoder(MoleculeModel):
	def __init__(self, model_cfg: Config) -> None:
	super(MoleculeDecoder, self).__init__(model_cfg)

	@abstractmethod
	def generate_loss(self, label: Featurized[Molecule], **kwargs) -> Dict[str, torch.Tensor]:
	raise NotImplementedError

	@abstractmethod
	def generate_molecule(self, **kwargs) -> List[Molecule]:
	raise NotImplementedError

	class ProteinModel(BaseModel):
	def __init__(self, model_cfg: Config) -> None:
	super().__init__(model_cfg)

	@abstractmethod
	def get_protein_processor(self) -> Tuple[ProteinFeaturizer, Collator]:
	raise NotImplementedError

	class ProteinEncoder(ProteinModel):
	def __init__(self, model_cfg: Config) -> None:
	super().__init__(model_cfg)

	@abstractmethod
	def encode_protein(self, protein: Union[Featurized[Protein], List[Protein]], **kwargs) -> torch.Tensor:
	raise NotImplementedError

	class ProteinDecoder(ProteinModel):
	def __init__(self, model_cfg: Config) -> None:
	super().__init__(model_cfg)

	@abstractmethod
	def generate_loss(self, label: Featurized[Protein], **kwargs) -> Dict[str, torch.Tensor]:
	raise NotImplementedError

	@abstractmethod
	def generate_protein(self, **kwargs) -> List[Protein]:
	raise NotImplementedError

	class TextEncoder(BaseModel, ABC):
	def __init__(self, model_cfg: Config) -> None:
	super(TextEncoder, self).__init__(model_cfg)

	@abstractmethod
	def get_text_processor(self) -> Tuple[TextFeaturizer, Collator]:
	raise NotImplementedError

	@abstractmethod
	def encode_text(self, text: Union[List[Text], Any]) -> torch.Tensor:
	raise NotImplementedError

	class ChatModel(BaseModel, ABC):
	class Role(Enum):
	USER = auto()
	ASSISTANT = auto()

	role_dict = {
	Role.USER: "USER",
	Role.ASSISTANT: "ASSISTANT",
	}
	def __init__(self, model_cfg: Config) -> None:
	super().__init__(model_cfg)
	self.messages = []

	def add_message(self, role: Role, message: Optional[str]) -> None:
	self.messages.append([role, message])

	def compose_context(self):
	ret = self.config.system_prompt + self.config.sep_tokens + " "
	for role, message in self.messages:
	if message:
	ret += self.role_dict[role] + ": " + message + " " + self.config.sep_tokens + " "
	else:
	ret += self.role_dict[role] + ": "
	return ret

	@abstractmethod
	def chat(self, user_prompt: Text) -> Text:
	raise NotImplementedError

	@abstractmethod
	def reset(self) -> None:
	raise NotImplementedError