Skip to content
This repository has been archived by the owner on Jul 18, 2024. It is now read-only.

Commit

Permalink
Merge pull request #505 from xuechendi/main
Browse the repository at this point in the history
[v1.2]add copyright to all new components
  • Loading branch information
xuechendi authored Dec 22, 2023
2 parents 1d14211 + ae95394 commit 5398747
Show file tree
Hide file tree
Showing 176 changed files with 2,717 additions and 223 deletions.
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/LLM/TextPipeline.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

from pyrecdp.core.di_graph import DiGraph
from pyrecdp.core.pipeline import BasePipeline
from pyrecdp.primitives.operations import Operation, BaseOperation
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/LLM/__init__.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

from pyrecdp.core.import_utils import check_availability_and_install, list_requirements

import os, pathlib
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/__init__.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

import os, sys
from pathlib import Path
try:
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/autofe/AutoFE.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

import logging
from pyrecdp.core.utils import Timer, infer_problem_type
from pyrecdp.core.dataframe import DataFrameAPI
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/autofe/FeatureEstimator.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

from pyrecdp.primitives.generators import *
from pyrecdp.autofe.TabularPipeline import TabularPipeline
import logging
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/autofe/FeatureProfiler.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

from jinja2 import Environment, PackageLoader
from pyrecdp.primitives.profilers import *
from pyrecdp.primitives.generators import *
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/autofe/FeatureWrangler.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

from pyrecdp.primitives.generators import *
from pyrecdp.primitives.profilers import *
from pyrecdp.autofe.TabularPipeline import TabularPipeline
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/autofe/RelationalBuilder.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

from pyrecdp.primitives.generators import *
from pyrecdp.primitives.profilers import *
from pyrecdp.autofe.TabularPipeline import TabularPipeline
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/autofe/TabularPipeline.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

from pyrecdp.primitives.generators import *
from pyrecdp.core.schema import DataFrameSchema
from pyrecdp.core.di_graph import DiGraph
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/autofe/__init__.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

from pyrecdp.core.import_utils import check_availability_and_install, list_requirements

import os, pathlib
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/core/__init__.py
Original file line number Diff line number Diff line change
@@ -1 +1,17 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

from pyrecdp.data_processor import DataProcessor as SparkDataProcessor
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/core/cache_utils.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

import os

# Default cache location
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/core/class_utils.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""


def new_instance(module, clazz, **clazz_kwargs):
import importlib
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/core/dataframe.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

import pandas as pd

class DataFrameAPI:
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/core/di_graph.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

from collections import defaultdict

class Graph:
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/core/import_utils.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

import os
from typing import Optional
import pip
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/core/model_utils.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

""" This code is adapted from Alibaba data-juicer
https://github.com/alibaba/data-juicer/blob/main/data_juicer/utils/model_utils.py
"""
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/core/parallel_iterator.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

from concurrent.futures import ThreadPoolExecutor, ProcessPoolExecutor
import multiprocessing
from multiprocessing.pool import ThreadPool
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/core/pipeline.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

from pyrecdp.core.di_graph import DiGraph
from pyrecdp.primitives.operations import Operation
import logging
Expand Down
16 changes: 16 additions & 0 deletions RecDP/pyrecdp/core/registry.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,19 @@
"""
Copyright 2024 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

class Registry(object):
def __init__(self, registry_name):
self._name = registry_name
Expand Down
Loading

0 comments on commit 5398747

Please sign in to comment.