python_apps/crwlers/tmp_get_cateExt.py
2023-11-03 14:49:12 +09:00

39 lines
1.2 KiB
Python

#!/usr/bin/env python
import requests, bs4, urllib, sys, logging, re, subprocess
from urllib import parse
from datetime import datetime
# Wall-clock timestamp taken when the script starts; nothing in the visible
# part of this script reads it afterwards.
startTime = datetime.now()
def makeURL(url, term, campaign, *, encode=False):
    """Append the fixed tracking query parameters to ``url``.

    The appended text starts with ``&``, so ``url`` is presumably expected
    to already contain a query string (verify against the callers).
    ``utm_content`` is always the literal ``category``, whatever
    ``campaign`` is.

    Args:
        url: Base URL the tracking parameters are appended to.
        term: Keyword placed in ``utm_keyword``.
        campaign: Value placed in ``utm_campaign``.
        encode: When true, percent-encode ``term`` and ``campaign`` so
            that spaces, ``&``, ``=`` and non-ASCII characters cannot
            corrupt the query string.  Defaults to False, which inserts
            both values verbatim.

    Returns:
        The URL with the tracking parameters appended.
    """
    if encode:
        # safe="" also escapes "/" so the value is a single opaque token.
        term = parse.quote(term, safe="")
        campaign = parse.quote(campaign, safe="")
    return (
        url
        + "&BIZ_CD=1010187&utm_source=naverPowerlink&utm_medium=prdcpc"
        + "&utm_keyword=" + term
        + "&utm_campaign=" + campaign
        + "&utm_content=category"
    )
# Command-line inputs: source keyword, comma-separated prefixes,
# comma-separated suffixes, and the base landing URL.
if len(sys.argv) < 5:
    # Fail with a readable message instead of an IndexError traceback.
    sys.exit("usage: " + sys.argv[0] + " SRC_TERM PREFIXES SUFFIXES URL")
srcTerm = sys.argv[1]
prefix = sys.argv[2]
suffix = sys.argv[3]
url = sys.argv[4]
# str.split always returns at least one element; empty entries (from "",
# "a,,b" or a trailing comma) are skipped in the loops below.
prefixArr = prefix.split(",")
suffixArr = suffix.split(",")
prefixed = []
suffixed = []


def _emit(term, campaign):
    """Print one tab-separated row: source term, derived term, tagged URL."""
    print(srcTerm + "\t" + term + "\t" + makeURL(url, term, campaign))


# Row for the unmodified source term.
_emit(srcTerm, "category")

# One row per non-empty suffix: <source><suffix>.
for suffixItem in suffixArr:
    if suffixItem == "":
        continue
    suffixedterm = srcTerm + suffixItem
    suffixed.append(suffixedterm)
    _emit(suffixedterm, "ext")

# One row per non-empty prefix: <prefix><source>, followed by that prefix
# combined with every suffixed term: <prefix><source><suffix>.
# NOTE(review): the combination loop is assumed to sit under the
# non-empty-prefix check; confirm against the original indentation.
for prefixItem in prefixArr:
    if prefixItem == "":
        continue
    prefixedterm = prefixItem + srcTerm
    prefixed.append(prefixedterm)
    _emit(prefixedterm, "ext")
    for suffixedItem in suffixed:
        _emit(prefixItem + suffixedItem, "ext")