Skip to content

Commit

Permalink
Fix and detached the dependency on the ui as git module
Browse files Browse the repository at this point in the history
  • Loading branch information
SasCezar committed Oct 3, 2024
1 parent 8fc9f9f commit 4db2a0c
Show file tree
Hide file tree
Showing 15 changed files with 42 additions and 43 deletions.
3 changes: 0 additions & 3 deletions .gitmodules
Original file line number Diff line number Diff line change
@@ -1,3 +0,0 @@
[submodule "autofl-ui"]
path = autofl-ui
url = git@github.com:SasCezar/autofl-ui.git
1 change: 0 additions & 1 deletion autofl-ui
Submodule autofl-ui deleted from b697f2
2 changes: 1 addition & 1 deletion config/main.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,7 @@ defaults:
- _self_
- local: docker
- taxonomy: gitranking
- annotator: simple
- annotator: default
- version_strategy: latest
- dataloader: postgres
- writer: postgres
Expand Down
9 changes: 1 addition & 8 deletions docker-compose.yaml
Original file line number Diff line number Diff line change
@@ -1,4 +1,3 @@
version: "3.8"
services:
api:
build:
Expand Down Expand Up @@ -39,16 +38,10 @@ services:
- "8080:8080"

ui:
build:
context: autofl-ui/
dockerfile: ./docker/Dockerfile
image: cezarsas/autofl-ui:latest
ports:
- "8501:8501"
stdin_open: true # docker run -i
tty: true # docker run -t
volumes:
- type: bind
source: ./autofl-ui/
target: /autofl-ui
links:
- 'api:auto-fl'
30 changes: 21 additions & 9 deletions docker/Dockerfile
Original file line number Diff line number Diff line change
@@ -1,13 +1,25 @@
FROM python:3.10 as python-base
RUN mkdir autofl
WORKDIR /autofl
COPY pyproject.toml /autofl
RUN pip3 install poetry
RUN poetry config virtualenvs.create false
RUN poetry install -n --no-ansi --without dev
# Start with the official Python 3.10 image as base
FROM python:3.10 AS python-base

# Set working directory and copy pyproject.toml
WORKDIR /autofl
COPY pyproject.toml .

# Install poetry in a single layer and configure it
RUN pip install --no-cache-dir poetry \
&& poetry config virtualenvs.create false \
&& poetry install --no-root --no-ansi --without dev

# Copy the remaining application code
COPY . .

# Set environment variables
ENV PYTHONPATH=/autofl/src
ENV HYDRA_FULL_ERROR=1

HEALTHCHECK CMD curl --fail http://localhost:8000
# Define a health check command
HEALTHCHECK --interval=30s --timeout=10s --retries=3 \
CMD curl --fail http://localhost:8000 || exit 1

CMD ["gunicorn", "-w", "4", "-k", "uvicorn.workers.UvicornWorker", "api.main:app", "--bind", "0.0.0.0:8000", "--timeout", "100000"]
# Set the default command to start the app
CMD ["gunicorn", "-w", "4", "-k", "uvicorn.workers.UvicornWorker", "api.main:app", "--bind", "0.0.0.0:8000", "--timeout", "100000"]
2 changes: 1 addition & 1 deletion pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@ more-itertools = "^10.2.0"
tree-sitter = "^0.20.4"
sqlalchemy = "^2.0.25"
psycopg = {extras = ["binary"], version = "^3.1.17"}
gensim = "^4.3.2"
gensim = "^4.3.3"
fasttext-wheel = "^0.9.2"
transformers = "^4.37.1"
sentence-transformers = "^2.2.2"
Expand Down
4 changes: 2 additions & 2 deletions src/annotation/similarity.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,8 +4,8 @@
from loguru import logger
from sklearn.metrics.pairwise import cosine_similarity

from embedding.embedding import AbstractEmbeddingModel
from entity.taxonomy import TaxonomyBase
from embedding import AbstractEmbeddingModel
from entity import TaxonomyBase
from annotation import LFBase


Expand Down
1 change: 1 addition & 0 deletions src/embedding/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
from .abstract import AbstractEmbeddingModel
File renamed without changes.
6 changes: 3 additions & 3 deletions src/embedding/ft.py
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
import fasttext as ft
import numpy
import numpy as np

from embedding.embedding import AbstractEmbeddingModel
from embedding.abstract import AbstractEmbeddingModel


class FastTextEmbedding(AbstractEmbeddingModel):
Expand All @@ -14,7 +14,7 @@ def __init__(self, path: str, model: str = 'fastText', split_camel: bool = False
self._name = f'{model}'
self.model = ft.load_model(path)

def get_embedding(self, text: str) -> numpy.ndarray:
def get_embedding(self, text: str) -> np.ndarray:
"""
Returns the embedding of the text.
:param text:
Expand Down
10 changes: 4 additions & 6 deletions src/embedding/gensim_w2v.py
Original file line number Diff line number Diff line change
@@ -1,9 +1,7 @@
import re

import numpy
import numpy as np
from gensim.models import KeyedVectors
from embedding.embedding import AbstractEmbeddingModel

from embedding import AbstractEmbeddingModel


class W2VEmbedding(AbstractEmbeddingModel):
Expand All @@ -16,7 +14,7 @@ def __init__(self, path: str, model: str = 'W2V-Unk', split_camel: bool = False)
self._name = f'{model}'
self.model = KeyedVectors.load_word2vec_format(path, binary=True)

def get_embedding(self, text: str) -> numpy.ndarray:
def get_embedding(self, text: str) -> np.ndarray:
"""
Returns the embedding of the text.
:param text:
Expand All @@ -30,4 +28,4 @@ def get_embedding(self, text: str) -> numpy.ndarray:
embeddings.append(self.model[word])
else:
embeddings.append(np.zeros(self.model.vector_size))
return numpy.mean(embeddings, axis=0)
return np.mean(embeddings, axis=0)
8 changes: 4 additions & 4 deletions src/embedding/huggingface.py
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
import numpy
import numpy as np
import torch

from embedding.embedding import AbstractEmbeddingModel
from embedding.abstract import AbstractEmbeddingModel
from sentence_transformers import SentenceTransformer
from transformers import BertModel, BertTokenizer

Expand All @@ -18,7 +18,7 @@ def __init__(self, name, model, split_camel: bool = False):
self.model = BertModel.from_pretrained(model)
self.tokenizer = BertTokenizer.from_pretrained(model, do_lower_case=do_lower_case)

def get_embedding(self, text: str) -> numpy.ndarray:
def get_embedding(self, text: str) -> np.ndarray:
"""
Returns the embedding of the text.
:param text:
Expand All @@ -39,7 +39,7 @@ def __init__(self, name, model, device='cpu', split_camel: bool = False):
self.model = SentenceTransformer(model, device=device)
self.model.tokenizer.add_special_tokens({'pad_token': '[PAD]'})

def get_embedding(self, text: str) -> numpy.ndarray:
def get_embedding(self, text: str) -> np.ndarray:
"""
Returns the embedding of the text.
:param text:
Expand Down
6 changes: 3 additions & 3 deletions src/embedding/spacy_bert.py
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
import numpy
import numpy as np

from embedding.embedding import AbstractEmbeddingModel
from embedding.abstract import AbstractEmbeddingModel


class BERTEmbedding(AbstractEmbeddingModel):
Expand All @@ -13,7 +13,7 @@ def __init__(self, model, split_camel: bool = False):
self._name = f'{model}'
self.model = spacy.load(model, disable=["ner", "textcat", "parser"])

def get_embedding(self, text: str) -> numpy.ndarray:
def get_embedding(self, text: str) -> np.ndarray:
"""
Returns the embedding of the text.
:param text:
Expand Down
1 change: 1 addition & 0 deletions src/entity/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
from .taxonomy import TaxonomyBase
2 changes: 0 additions & 2 deletions src/pipeline/pipeline.py
Original file line number Diff line number Diff line change
@@ -1,5 +1,4 @@
from abc import ABC
from pathlib import Path
from typing import List, Tuple

from loguru import logger
Expand All @@ -16,7 +15,6 @@ class PipelineBase(ABC):
def run(self, project: Project, version: Version) -> Tuple[Project, Version]:
pass


# TODO: Move to BATCH, and use the Execution pipeline
class BatchPipeline:
def __init__(self, pipeline: ExecutionBase,
Expand Down

0 comments on commit 4db2a0c

Please sign in to comment.