Skip to content

Commit f09c58f

Browse files
authored
Update FG document (#540)
1 parent ae3e855 commit f09c58f

File tree

15 files changed

+415
-39
lines changed

15 files changed

+415
-39
lines changed

docker/Dockerfile_paitf115

Lines changed: 36 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,36 @@
1+
FROM dsw-registry.cn-shanghai.cr.aliyuncs.com/pai/tensorflow-training:1.15PAI-cpu-py36-ubuntu18.04
2+
3+
COPY docker/sources_18.04.list /etc/apt/sources.list
4+
5+
# necessary for later commands to take effect
6+
RUN md5sum /etc/apt/sources.list
7+
8+
# Refresh the package index and install in a single layer so a cached
# "apt-get update" layer is never paired with a changed package list.
# The index files are removed in the same layer to keep them out of the image.
RUN apt-get update && apt-get install -y \
      apt-utils \
      curl \
      g++ \
      gcc \
      inetutils-ping \
      libpq-dev \
      libsasl2-dev \
      openjdk-8-jdk \
      strace \
      telnet \
      unzip \
      vim \
      wget \
    && rm -rf /var/lib/apt/lists/*
10+
11+
RUN mkdir /EasyRec
12+
COPY requirements /EasyRec/requirements
13+
COPY requirements.txt /EasyRec/
14+
COPY easy_rec /EasyRec/easy_rec/
15+
COPY setup.cfg /EasyRec/
16+
COPY setup.py /EasyRec/
17+
COPY MANIFEST.in /EasyRec/
18+
COPY README.md /EasyRec/
19+
COPY scripts /EasyRec/scripts
20+
21+
RUN curl "http://easyrec.oss-cn-beijing.aliyuncs.com/tools/odpscmd_public_0.45.0.zip" -o /EasyRec/odpscmd_public.zip
22+
RUN mkdir /usr/local/odps_clt/ && cd /usr/local/odps_clt/ && unzip /EasyRec/odpscmd_public.zip
23+
RUN ln -s /usr/local/odps_clt/bin/odpscmd /usr/local/bin/odpscmd
24+
RUN pip3 install --upgrade pip
25+
# Install from the Aliyun PyPI mirror; the mirror is addressed over plain HTTP,
# so the host has to be marked as trusted. The flags are only needed once.
RUN pip3 install pystack-debugger idna kafka-python -i http://mirrors.aliyun.com/pypi/simple --trusted-host mirrors.aliyun.com
26+
RUN pip3 install -r /EasyRec/requirements/runtime.txt
27+
RUN pip3 install -r /EasyRec/requirements/extra.txt -i http://mirrors.aliyun.com/pypi/simple --trusted-host mirrors.aliyun.com
28+
RUN pip3 install http://easyrec.oss-cn-beijing.aliyuncs.com/3rdparty/graphlearn-1.1.0-cp36-cp36m-linux_x86_64.whl -i http://mirrors.aliyun.com/pypi/simple --trusted-host mirrors.aliyun.com
29+
RUN pip3 install http://easyrec.oss-cn-beijing.aliyuncs.com/releases/pai_automl-0.0.1rc1-py3-none-any.whl -i http://mirrors.aliyun.com/pypi/simple --trusted-host mirrors.aliyun.com
30+
RUN pip3 install https://easyrec.oss-cn-beijing.aliyuncs.com/3rdparty/common_io-0.4.2%2Btunnel-py2.py3-none-any.whl -i http://mirrors.aliyun.com/pypi/simple --trusted-host mirrors.aliyun.com
31+
RUN pip3 install tensorflow_probability==0.8 -i http://mirrors.aliyun.com/pypi/simple --trusted-host mirrors.aliyun.com
32+
RUN cd /EasyRec && pip install .
33+
RUN rm -rf /EasyRec
34+
RUN python -c "import easy_rec; easy_rec.help(); import pyhive; import datahub; import kafka"
35+
36+
COPY docker/hadoop_env.sh /opt/hadoop_env.sh

docker/Dockerfile_tf211

Lines changed: 36 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,36 @@
1+
FROM dsw-registry.cn-shanghai.cr.aliyuncs.com/pai/tensorflow:2.11-cpu-py39-ubuntu20.04-1
2+
COPY docker/sources_20.04.list /etc/apt/sources.list
3+
4+
# necessary for later commands to take effect
5+
RUN md5sum /etc/apt/sources.list
6+
7+
# Refresh the package index and install in a single layer so a cached
# "apt-get update" layer is never paired with a changed package list.
# The index files are removed in the same layer to keep them out of the image.
RUN apt-get update && apt-get install -y \
      apt-utils \
      curl \
      g++ \
      gcc \
      inetutils-ping \
      libpq-dev \
      libsasl2-dev \
      openjdk-8-jdk \
      strace \
      telnet \
      unzip \
      vim \
      wget \
    && rm -rf /var/lib/apt/lists/*
9+
10+
RUN mkdir /EasyRec
11+
COPY requirements /EasyRec/requirements
12+
COPY requirements.txt /EasyRec/
13+
COPY easy_rec /EasyRec/easy_rec/
14+
COPY setup.cfg /EasyRec/
15+
COPY setup.py /EasyRec/
16+
COPY MANIFEST.in /EasyRec/
17+
COPY README.md /EasyRec/
18+
COPY scripts /EasyRec/scripts
19+
20+
RUN curl "http://easyrec.oss-cn-beijing.aliyuncs.com/tools/odpscmd_public_0.45.0.zip" -o /EasyRec/odpscmd_public.zip
21+
RUN mkdir /usr/local/odps_clt/ && cd /usr/local/odps_clt/ && unzip /EasyRec/odpscmd_public.zip
22+
RUN ln -s /usr/local/odps_clt/bin/odpscmd /usr/local/bin/odpscmd
23+
RUN python -m pip install --upgrade pip
24+
# Install from the Aliyun PyPI mirror; the mirror is addressed over plain HTTP,
# so the host has to be marked as trusted. The flags are only needed once.
RUN pip3 install pystack-debugger idna kafka-python -i http://mirrors.aliyun.com/pypi/simple --trusted-host mirrors.aliyun.com
25+
RUN pip3 install -r /EasyRec/requirements/runtime.txt -i http://mirrors.aliyun.com/pypi/simple --trusted-host mirrors.aliyun.com
26+
RUN pip3 install -r /EasyRec/requirements/extra.txt -i http://mirrors.aliyun.com/pypi/simple --trusted-host mirrors.aliyun.com
27+
RUN pip3 install https://tzrec.oss-cn-beijing.aliyuncs.com/third_party/graphlearn-1.2.0-cp39-cp39-linux_x86_64.whl -i http://mirrors.aliyun.com/pypi/simple --trusted-host mirrors.aliyun.com
28+
# RUN pip3 install http://easyrec.oss-cn-beijing.aliyuncs.com/releases/pai_automl-0.0.1rc1-py3-none-any.whl -i http://mirrors.aliyun.com/pypi/simple --trusted-host mirrors.aliyun.com
29+
RUN pip3 install tensorflow_probability==0.19.0 -i http://mirrors.aliyun.com/pypi/simple --trusted-host mirrors.aliyun.com
30+
#RUN pip3 install encodings
31+
# common_io wheel, version 0.4.2+tunnel ("%2B" is the URL-encoded "+").
# The previous URL spelled the version "0.4.j2", which is not a valid wheel version.
RUN pip3 install https://easyrec.oss-cn-beijing.aliyuncs.com/3rdparty/common_io-0.4.2%2Btunnel-py2.py3-none-any.whl -i http://mirrors.aliyun.com/pypi/simple --trusted-host mirrors.aliyun.com
32+
RUN cd /EasyRec && pip install .
33+
RUN rm -rf /EasyRec
34+
# RUN python -c "import easy_rec; easy_rec.help(); import pyhive; import datahub; import kafka"
35+
36+
COPY docker/hadoop_env.sh /opt/hadoop_env.sh

docs/images/other/fg.svg

Lines changed: 1 addition & 0 deletions
Loading

docs/source/feature/feature.rst

Lines changed: 0 additions & 21 deletions
Original file line numberDiff line numberDiff line change
@@ -462,27 +462,6 @@ ExprFeature:表达式特征
462462
- 当前版本未定义"&","|"的符号优先级,建议使用括号保证优先级。
463463
- customized normalization: "tf.math.log1p(user_age) / 10.0"
464464

465-
EmbeddingVariable
466-
----------------------------------------------------------------
467-
Key Value Hash, 减少hash冲突, 支持特征准入和特征淘汰。
468-
469-
.. code:: protobuf
470-
471-
model_config {
472-
model_class: "MultiTower"
473-
...
474-
ev_params {
475-
filter_freq: 2
476-
}
477-
}
478-
- 配置方式:
479-
- feature_config单独配置ev_params
480-
- model_config里面统一配置ev_params
481-
482-
- ev_params : EVParams
483-
- filter_freq: 频次过滤, 低频特征噪声大,过滤噪声让模型更鲁棒
484-
- steps_to_live: 特征淘汰, 淘汰过期特征,防止模型过大
485-
- Note: 仅在安装PAI-TF/DeepRec时可用
486465

487466
特征选择
488467
----------------------------------------------------------------

0 commit comments

Comments
 (0)