add workflow CRM标签信息,dev

This commit is contained in:
root 2024-07-09 16:44:53 +08:00
parent 13c9fb9207
commit 2591c018e4
6 changed files with 293 additions and 0 deletions

View File

@ -0,0 +1,70 @@
#!/usr/bin/python
# -*- encoding=utf-8 -*-
from airflow import DAG
from datetime import datetime, timedelta
from airflow.contrib.hooks.ssh_hook import SSHHook
from airflow.contrib.operators.ssh_operator import SSHOperator
from airflow.sensors.external_task_sensor import ExternalTaskSensor
import json
from airflow.operators.trigger_dagrun import TriggerDagRunOperator
from airflow.operators.email_operator import EmailOperator
from airflow.utils.trigger_rule import TriggerRule
# SSH connection (Airflow connection id 'ssh_air') shared by the remote tasks.
sshHook = SSHHook(ssh_conn_id='ssh_air')

# Defaults applied to every task of the DAG unless a task overrides them.
default_args = dict(
    owner='info@idgvalue.com',
    start_date=datetime(2024, 1, 1),
    depends_on_past=False,
    email_on_failure=True,
    email_on_retry=True,
    retries=6,
    retry_delay=timedelta(minutes=10),
)

# Scheduled at minute 0 of every hour; catchup is disabled, at most three
# runs may be active at once and a run times out after 160 minutes.
dag = DAG(
    dag_id='wf_dag_crm_tags',
    default_args=default_args,
    schedule_interval="0 0-23/1 * * *",
    catchup=False,
    max_active_runs=3,
    dagrun_timeout=timedelta(minutes=160),
)
# Failure notification: e-mails the owner when an upstream task has failed.
task_failed = EmailOperator(
    dag=dag,
    task_id="task_failed",
    # ONE_FAILED: fire as soon as at least one upstream task has failed.
    trigger_rule=TriggerRule.ONE_FAILED,
    to=["info@idgvalue.com"],
    # NOTE(review): cc contains a single empty address - confirm whether it
    # can simply be dropped.
    cc=[""],
    subject="crm_tags_failed",
    # The stray, unmatched double quote that used to be rendered in the
    # message body has been removed.
    html_content='<h3>您好crm_tags作业失败请及时处理 </h3>')
# Runs the huiju_tags_feign.py script on the remote host over SSH.
huiju_tags_feign = SSHOperator(
    task_id='huiju_tags_feign',
    dag=dag,
    ssh_hook=sshHook,
    command='python3 /data/airflow/etl/API/huiju_tags_feign.py',
    retries=3,
    depends_on_past=False,
)

# Runs run_psql.sh with the execution date (YYYYMMDD) and the job name
# taken from params.my_param.
huiju_tags_load = SSHOperator(
    task_id='huiju_tags_load',
    dag=dag,
    ssh_hook=sshHook,
    params={'my_param': "huiju_tags_load"},
    command='/data/airflow/etl/API/run_psql.sh {{ ds_nodash }} {{params.my_param }}',
    retries=3,
    depends_on_past=False,
)

# The load step runs only after the fetch step.
huiju_tags_feign.set_downstream(huiju_tags_load)
# Runs run_sa.sh for the S98_S_crm_tags job; stdout and stderr are appended
# to a per-day log file on the remote host.
crm_tags_1237 = SSHOperator(
    task_id='crm_tags_1237',
    dag=dag,
    ssh_hook=sshHook,
    params={'my_param': "S98_S_crm_tags"},
    command='/data/airflow/etl/SA/run_sa.sh {{ ds_nodash }} {{ params.my_param }} >>/data/airflow/logs/run_psql_{{ds_nodash}}.log 2>&1 ',
    retries=3,
    depends_on_past=False,
)

# API load -> SA load -> failure notification.
huiju_tags_load >> crm_tags_1237 >> task_failed

View File

@ -0,0 +1,46 @@
/*******Main Section**************************************************************************/
\set ON_ERROR_STOP on
\set AUTOCOMMIT on
\timing on

-- Step 1: full refresh of p10_sa.S98_S_crm_tags from p00_tal.S98_S_crm_tags.
-- The delete and the insert share one transaction: if the insert fails,
-- ON_ERROR_STOP ends the script and the open transaction is rolled back, so
-- the table keeps its previous contents instead of being left empty.
begin;
delete from p10_sa.S98_S_crm_tags
;
insert into p10_sa.S98_S_crm_tags
( id
, name
, group_name
, type
, date_created
, last_updated
, etl_tx_dt )
select
id
, name
, group_name
, type
, date_created
, last_updated
, etl_tx_dt
from p00_tal.S98_S_crm_tags
;
commit;

-- Step 2: full refresh of p12_sfull.S98_S_crm_tags from the table loaded in
-- step 1, again as a single transaction.
begin;
delete from p12_sfull.S98_S_crm_tags
;
insert into p12_sfull.S98_S_crm_tags
( id
, name
, group_name
, type
, date_created
, last_updated
, etl_tx_dt )
select
id
, name
, group_name
, type
, date_created
, last_updated
, etl_tx_dt
from p10_sa.S98_S_crm_tags
;
commit;
\q

View File

@ -0,0 +1,18 @@
-- Foreign table mapping data_api.crm_tags on server pgsql_server_S98_S
-- into the p00_tal schema.
CREATE FOREIGN TABLE IF NOT EXISTS p00_tal.S98_S_crm_tags (
    id            text,
    name          text,
    group_name    text,
    type          text,
    date_created  text,
    last_updated  text,
    etl_tx_dt     timestamp
)
SERVER pgsql_server_S98_S
OPTIONS (schema_name 'data_api', table_name 'crm_tags');

View File

@ -0,0 +1,43 @@
-- p10_sa copy of the CRM tag table; every business column is kept as text.
create table if not exists p10_sa.S98_S_crm_tags (
id TEXT
, name TEXT
, group_name TEXT
, type TEXT
, date_created TEXT
, last_updated TEXT
, etl_tx_dt TIMESTAMP
) ;
COMMENT ON COLUMN p10_sa.S98_S_crm_tags.id IS '标签对应Id';
COMMENT ON COLUMN p10_sa.S98_S_crm_tags.name IS '标签名';
COMMENT ON COLUMN p10_sa.S98_S_crm_tags.group_name IS '标签分组名';
COMMENT ON COLUMN p10_sa.S98_S_crm_tags.type IS '标签类型';
COMMENT ON COLUMN p10_sa.S98_S_crm_tags.date_created IS '创建时间';
COMMENT ON COLUMN p10_sa.S98_S_crm_tags.last_updated IS '上次更新时间';
-- The two comments below used to be empty strings, which store no
-- description at all; they are now filled in.
COMMENT ON COLUMN p10_sa.S98_S_crm_tags.etl_tx_dt IS 'ETL加载时间';
COMMENT ON TABLE p10_sa.S98_S_crm_tags IS 'CRM标签信息';
-- p12_sfull copy of the CRM tag table; every business column is kept as text.
create table if not exists p12_sfull.S98_S_crm_tags (
id TEXT
, name TEXT
, group_name TEXT
, type TEXT
, date_created TEXT
, last_updated TEXT
, etl_tx_dt TIMESTAMP
) ;
COMMENT ON COLUMN p12_sfull.S98_S_crm_tags.id IS '标签对应Id';
COMMENT ON COLUMN p12_sfull.S98_S_crm_tags.name IS '标签名';
COMMENT ON COLUMN p12_sfull.S98_S_crm_tags.group_name IS '标签分组名';
COMMENT ON COLUMN p12_sfull.S98_S_crm_tags.type IS '标签类型';
COMMENT ON COLUMN p12_sfull.S98_S_crm_tags.date_created IS '创建时间';
COMMENT ON COLUMN p12_sfull.S98_S_crm_tags.last_updated IS '上次更新时间';
-- The two comments below used to be empty strings, which store no
-- description at all; they are now filled in.
COMMENT ON COLUMN p12_sfull.S98_S_crm_tags.etl_tx_dt IS 'ETL加载时间';
COMMENT ON TABLE p12_sfull.S98_S_crm_tags IS 'CRM标签信息';

View File

@ -0,0 +1,74 @@
# coding: utf-8
import requests
import json
import psycopg2
import uuid
import datetime
import time
import hashlib
import time
# Huiju
# Module-level presets, kept as ready-made values for request parameters.
_ISO_FORMAT = "%Y-%m-%dT%H:%M:%SZ"

current_date = datetime.date.today()  # today's date
previous_date = current_date + datetime.timedelta(days=-1)  # yesterday's date
formatted_current_date = current_date.strftime(_ISO_FORMAT)  # today, formatted
formatted_previous_date = previous_date.strftime(_ISO_FORMAT)  # yesterday, formatted

timestamp = time.time()  # Unix time: seconds since 1970-01-01 00:00:00
sign_version = 'v2'  # signature version, fixed to v2
nonce = str(uuid.uuid4())  # random value, generated once per run
# Build the request signature
def sign_data(email, open_api_token, timestamp, nonce, sign_version):
    """Return the SHA-256 hex digest of the five fields joined by '&'.

    The fields are concatenated in the order
    email, open_api_token, timestamp, nonce, sign_version.
    """
    fields = (email, open_api_token, timestamp, nonce, sign_version)
    payload = "{}&{}&{}&{}&{}".format(*fields)
    hasher = hashlib.sha256()
    hasher.update(payload.encode())
    return hasher.hexdigest()
# Fetch the authorization token
def get_token(url, timeout=30):
    """Call the token endpoint and return its decoded JSON body.

    Args:
        url: Full URL of the token endpoint, query string included.
        timeout: Seconds to wait for the server. Without a timeout the
            request could block forever and stall the whole job.

    Returns:
        The parsed JSON payload, or None when the response is falsy
        (requests treats 4xx/5xx responses as falsy).
    """
    authRequest = requests.get(url, timeout=timeout)
    if not authRequest:
        return None
    return json.loads(authRequest.text)
# Main flow: request a token, download the tag list and store it as one row
# in data_api.api_data.
print('开始加载数据huiju_tags:荟聚标签信息')
# NOTE(review): the app secret in this URL and the database password further
# down are hard-coded; they should come from a secret store or environment.
authUrl='https://api.huiju.cool/v2/oauth2/token?app_id=cl037b184ebccd97c&secret=deaa83fdd8d385eec0d1d04d34282c4ec8c33b60&grant_type=client_credentials'
print('开始请求令牌。')
auth = get_token(authUrl)
# Retry every 60 seconds, at most 60 times, while the token request fails.
# get_token returns None for a failed HTTP response, so that case is checked
# before looking for an 'error' key (the old check raised TypeError on None).
i = 0
while (not auth or 'error' in auth) and i < 60:
    time.sleep(60)
    auth = get_token(authUrl)
    i = i + 1
# Stop with a clear message instead of a KeyError when no token was obtained.
if not auth or 'access_token' not in auth:
    raise RuntimeError('huiju_tags: could not obtain an access token: %r' % (auth,))

print('开始请求数据总数。')
url='https://api.huiju.cool/v2/tags'
header={}
body={'access_token':auth['access_token'],}
# A timeout keeps the job from hanging on a stalled connection, and
# raise_for_status surfaces HTTP errors before the body is parsed.
dataReqL=requests.get(url,headers=header,params=body,timeout=60)
dataReqL.raise_for_status()
resL=json.loads(dataReqL.text)
dataList=resL['data']
total=len(dataList)

conn = psycopg2.connect(database="dataops_db", user="dbuser_dops", password="MIgTi3jA",
                        host="172.17.0.8", port="5432")
# try/finally guarantees the cursor and connection are closed even when the
# statement fails.
try:
    print('数据库连接成功')
    dataId=str(uuid.uuid4())
    print('临时id'+dataId)
    json_object = json.dumps(dataList)
    cur=conn.cursor()
    try:
        # Mark earlier rows of this API as loaded, then insert the new
        # payload as the single unloaded row (is_loaded = '0').
        sql="update data_api.api_data set is_loaded = '1' where api_id = 'a7cf7f4d-108d-410c-9308-e13dfc56';INSERT INTO data_api.api_data (id,api_id,data,total_num,is_loaded,status,request_tm,execute_tm,remark) values (%s,%s,%s,%s,'0','0',current_timestamp(0),current_timestamp(0),'')"
        cur.execute(sql,[dataId,'a7cf7f4d-108d-410c-9308-e13dfc56',json_object,total])
        conn.commit()
    finally:
        cur.close()
finally:
    conn.close()
print('加载数据结束huiju_tags:荟聚标签信息')

View File

@ -0,0 +1,42 @@
/*******Main Section**************************************************************************/
\set ON_ERROR_STOP on
\set AUTOCOMMIT on
\timing on

-- Rebuild data_api.crm_tags from the newest unloaded api_data row.
-- The delete, the insert and the bookkeeping update share one transaction:
-- if any statement fails, ON_ERROR_STOP ends the script and the open
-- transaction is rolled back, so crm_tags keeps its previous contents.
begin;
DELETE FROM data_api.crm_tags;
insert into data_api.crm_tags (
id
, name
, group_name
, type
, date_created
, last_updated
,etl_tx_dt
)
select
-- Blank (whitespace-only) strings are stored as NULL.
case when trim(both from id)='' then null else id::text end id
, case when trim(both from name)='' then null else name::text end name
, case when trim(both from group_name)='' then null else group_name::text end group_name
, case when trim(both from type)='' then null else type::text end type
, case when trim(both from date_created)='' then null else date_created::text end date_created
, case when trim(both from last_updated)='' then null else last_updated::text end last_updated
,etl_tx_dt
from (
select
-- Each json_array_elements call expands the same JSON array, one row per
-- element; the fields are read from the element by key.
(json_array_elements(data::json)::json->>'id') id
, (json_array_elements(data::json)::json->>'name') name
, (json_array_elements(data::json)::json->>'groupName') group_name
, (json_array_elements(data::json)::json->>'type') type
, (json_array_elements(data::json)::json->>'dateCreated') date_created
, (json_array_elements(data::json)::json->>'lastUpdated') last_updated
,CURRENT_TIMESTAMP(0) etl_tx_dt
-- Only the most recent row still flagged is_loaded = '0' is used.
from (select * from data_api.api_data
WHERE api_id='a7cf7f4d-108d-410c-9308-e13dfc56' and is_loaded = '0' order by request_tm desc limit 1) p )p;
-- Flag the rows of this API as loaded.
-- NOTE(review): this touches every row for the api_id and also overwrites
-- request_tm on all of them - confirm that is intended.
update data_api.api_data
set is_loaded = '1' ,
status = '1',
request_tm = current_timestamp(0)
where api_id='a7cf7f4d-108d-410c-9308-e13dfc56';
commit;
\q