Skip to content

Commit

Permalink
Merge branch 'dev' into transform-pipeline
Browse files: browse the repository at this point in the history
  • Loading branch information
daw3rd committed Sep 20, 2024
2 parents 8fc7637 + eba80df commit 68a1f7e
Show file tree
Hide file tree
Showing 23 changed files with 67 additions and 23 deletions.
4 changes: 3 additions & 1 deletion .github/workflows/test-code-code2parquet.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/code/code2parquet
run: |
if [ -e "transforms/code/code2parquet/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/code/code2parquet/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/code/code2parquet DOCKER=docker test-image
else
echo "transforms/code/code2parquet/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-code-code_quality.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/code/code_quality
run: |
if [ -e "transforms/code/code_quality/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/code/code_quality/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/code/code_quality DOCKER=docker test-image
else
echo "transforms/code/code_quality/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-code-header_cleanser.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/code/header_cleanser
run: |
if [ -e "transforms/code/header_cleanser/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/code/header_cleanser/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/code/header_cleanser DOCKER=docker test-image
else
echo "transforms/code/header_cleanser/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-code-malware.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/code/malware
run: |
if [ -e "transforms/code/malware/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/code/malware/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/code/malware DOCKER=docker test-image
else
echo "transforms/code/malware/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-code-proglang_select.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/code/proglang_select
run: |
if [ -e "transforms/code/proglang_select/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/code/proglang_select/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/code/proglang_select DOCKER=docker test-image
else
echo "transforms/code/proglang_select/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-code-repo_level_ordering.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/code/repo_level_ordering
run: |
if [ -e "transforms/code/repo_level_ordering/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/code/repo_level_ordering/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/code/repo_level_ordering DOCKER=docker test-image
else
echo "transforms/code/repo_level_ordering/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-language-doc_chunk.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/language/doc_chunk
run: |
if [ -e "transforms/language/doc_chunk/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/language/doc_chunk/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/language/doc_chunk DOCKER=docker test-image
else
echo "transforms/language/doc_chunk/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-language-doc_quality.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/language/doc_quality
run: |
if [ -e "transforms/language/doc_quality/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/language/doc_quality/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/language/doc_quality DOCKER=docker test-image
else
echo "transforms/language/doc_quality/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-language-lang_id.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/language/lang_id
run: |
if [ -e "transforms/language/lang_id/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/language/lang_id/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/language/lang_id DOCKER=docker test-image
else
echo "transforms/language/lang_id/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-language-pdf2parquet.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/language/pdf2parquet
run: |
if [ -e "transforms/language/pdf2parquet/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/language/pdf2parquet/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/language/pdf2parquet DOCKER=docker test-image
else
echo "transforms/language/pdf2parquet/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-language-pii_redactor.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/language/pii_redactor
run: |
if [ -e "transforms/language/pii_redactor/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/language/pii_redactor/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/language/pii_redactor DOCKER=docker test-image
else
echo "transforms/language/pii_redactor/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-language-text_encoder.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/language/text_encoder
run: |
if [ -e "transforms/language/text_encoder/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/language/text_encoder/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/language/text_encoder DOCKER=docker test-image
else
echo "transforms/language/text_encoder/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-transform.template
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in @TARGET_TRANSFORM_DIR@
run: |
if [ -e "@TARGET_TRANSFORM_DIR@/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "@TARGET_TRANSFORM_DIR@/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C @TARGET_TRANSFORM_DIR@ DOCKER=docker test-image
else
echo "@TARGET_TRANSFORM_DIR@/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-universal-doc_id.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/universal/doc_id
run: |
if [ -e "transforms/universal/doc_id/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/universal/doc_id/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/universal/doc_id DOCKER=docker test-image
else
echo "transforms/universal/doc_id/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-universal-ededup.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/universal/ededup
run: |
if [ -e "transforms/universal/ededup/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/universal/ededup/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/universal/ededup DOCKER=docker test-image
else
echo "transforms/universal/ededup/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-universal-fdedup.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/universal/fdedup
run: |
if [ -e "transforms/universal/fdedup/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/universal/fdedup/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/universal/fdedup DOCKER=docker test-image
else
echo "transforms/universal/fdedup/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-universal-filter.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/universal/filter
run: |
if [ -e "transforms/universal/filter/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/universal/filter/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/universal/filter DOCKER=docker test-image
else
echo "transforms/universal/filter/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-universal-html2parquet.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/universal/html2parquet
run: |
if [ -e "transforms/universal/html2parquet/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/universal/html2parquet/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/universal/html2parquet DOCKER=docker test-image
else
echo "transforms/universal/html2parquet/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-universal-noop.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/universal/noop
run: |
if [ -e "transforms/universal/noop/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/universal/noop/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/universal/noop DOCKER=docker test-image
else
echo "transforms/universal/noop/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-universal-profiler.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/universal/profiler
run: |
if [ -e "transforms/universal/profiler/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/universal/profiler/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/universal/profiler DOCKER=docker test-image
else
echo "transforms/universal/profiler/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-universal-resize.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/universal/resize
run: |
if [ -e "transforms/universal/resize/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/universal/resize/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/universal/resize DOCKER=docker test-image
else
echo "transforms/universal/resize/Makefile not found - testing disabled for this transform."
Expand Down
4 changes: 3 additions & 1 deletion .github/workflows/test-universal-tokenization.yml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@ jobs:
- name: Test transform image in transforms/universal/tokenization
run: |
if [ -e "transforms/universal/tokenization/Makefile" ]; then
make -C data-processing-lib/spark DOCKER=docker image
if [ -d "transforms/universal/tokenization/spark" ]; then
make -C data-processing-lib/spark DOCKER=docker image
fi
make -C transforms/universal/tokenization DOCKER=docker test-image
else
echo "transforms/universal/tokenization/Makefile not found - testing disabled for this transform."
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -27,5 +27,5 @@ def __init__(self):

if __name__ == "__main__":
launcher = PythonTransformLauncher(HeaderCleanserPythonTransformConfiguration())
logger.info("Launching license copyright header removal")
logger.info("Launching license copyright header removal.")
launcher.launch()

0 comments on commit 68a1f7e

Please sign in to comment.