From 7d5e15c10ceab7cc67a9870624e7fecf515c3ea3 Mon Sep 17 00:00:00 2001 From: truskovskiyk Date: Mon, 8 Jul 2024 21:49:21 -0400 Subject: [PATCH] clean --- .github/workflows/module-3.yaml | 32 +++----------------------------- module-3/README.md | 32 ++++++++++++++++++++------------ 2 files changed, 23 insertions(+), 41 deletions(-) diff --git a/.github/workflows/module-3.yaml b/.github/workflows/module-3.yaml index da72d69..73d86a9 100644 --- a/.github/workflows/module-3.yaml +++ b/.github/workflows/module-3.yaml @@ -22,21 +22,16 @@ jobs: test: runs-on: ubuntu-latest steps: - - name: Checkout - uses: actions/checkout@v2 - - name: Login to Docker Hub - uses: docker/login-action@v1 - with: - username: ${{ secrets.DOCKER_HUB_USERNAME }} - password: ${{ secrets.DOCKER_HUB_ACCESS_TOKEN }} + - name: Checkout + uses: actions/checkout@v4 - name: Set up Docker Buildx uses: docker/setup-buildx-action@v1 - name: Build new run: | - docker build -f week-3/nlp-sample/Dockerfile -t nlp-sample:latest week-3/nlp-sample + docker build -f module-3/nlp-sample/Dockerfile -t nlp-sample:latest module-3/nlp-sample - name: Test style run: | @@ -67,24 +62,3 @@ jobs: # tags: ${{ secrets.DOCKER_HUB_USERNAME }}/${{ env.IMAGE_MAIN_NAME }}:${{ env.IMAGE_MAIN_TAG }} # cache-from: type=registry,ref=${{ secrets.DOCKER_HUB_USERNAME }}/${{ env.IMAGE_MAIN_NAME }}:buildcache # cache-to: type=registry,ref=${{ secrets.DOCKER_HUB_USERNAME }}/${{ env.IMAGE_MAIN_NAME }}:buildcache,mode=max - - cml-test: - - runs-on: ubuntu-latest - steps: - - uses: actions/checkout@v2 - - - uses: iterative/setup-cml@v1 - - - name: Train model - run: | - docker build -f week-3/nlp-sample/Dockerfile -t nlp-sample:latest week-3/nlp-sample - docker run -v $PWD:/tmp/results -e WANDB_PROJECT=${{ secrets.WANDB_PROJECT }} -e WANDB_API_KEY=${{ secrets.WANDB_API_KEY }} nlp-sample:latest make train_fast_ci - - - name: Write CML report - env: - REPO_TOKEN: ${{ secrets.GITHUB_TOKEN }} - run: | - # Post reports as comments in GitHub PRs - # cat results.txt >> report.md - cml send-comment README.md diff --git a/module-3/README.md b/module-3/README.md index ab4d67b..33633c3 100644 --- a/module-3/README.md +++ b/module-3/README.md @@ -18,6 +18,11 @@ - [ML project](https://github.com/ashleve/lightning-hydra-template.git) - [Advanced features](https://github.com/Lightning-AI/lightning) +## Styling + +[ruff](https://github.com/astral-sh/ruff) + + ## Configuration [hydra](https://hydra.cc/docs/intro/) @@ -33,26 +38,29 @@ https://neptune.ai/blog/best-ml-experiment-tracking-tools - [GPT-4o](https://openai.com/index/hello-gpt-4o/) - [GPT-4 System Card](https://cdn.openai.com/papers/gpt-4-system-card.pdf) -## Classic example Example ML model with testing: BERT-based training +## Classic example: BERT-based training [nlp-sample](./nlp-sample) +## Modern example: GenAI-based training + +TODO -## Eval: +https://huggingface.co/microsoft/Phi-3-mini-128k-instruct/tree/main +https://github.com/microsoft/Phi-3CookBook +https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard -- https://github.com/explodinggradients/ragas -- https://github.com/NVIDIA/NeMo-Guardrails -- https://github.com/guardrail-ml/guardrail -- https://github.com/promptfoo/promptfoo -- https://github.com/confident-ai/deepeval +## GenAI testing: -``` -pip install nemoguardrails -pip install openai -export OPENAI_API_KEY=********** -``` +- [deepeval](https://github.com/confident-ai/deepeval) +- [LLM Testing in 2024: Top Methods and Strategies](https://www.confident-ai.com/blog/llm-testing-in-2024-top-methods-and-strategies) +- [promptfoo](https://github.com/promptfoo/promptfoo) +- [uptrain](https://github.com/uptrain-ai/uptrain) +- [ragas](https://github.com/explodinggradients/ragas) +- [NeMo Guardrails](https://github.com/NVIDIA/NeMo-Guardrails) +- [Automated Unit Test Improvement using Large Language Models at Meta](https://arxiv.org/abs/2402.09171)