extract url parameters python
# Analysing URL parameters with Python for SEO
from pandas import DataFrame, read_csv
import urllib.parse as urlparse
from urllib.parse import parse_qs
# Script: count how many distinct URLs in a CSV column carry each query-string
# parameter, then write the (parameter, count) table to a new CSV, most
# frequent parameter first.

# Configuration: CSV to read, CSV to write, and the column that holds the URLs.
input_file = "spreadsheet.csv"
output_file = "output.csv"
url_column = "Address"

# Load only the URL column. Empty cells are read as NaN (a float), which
# urlparse cannot handle, so drop them before de-duplicating.
urls = read_csv(input_file, usecols=[url_column])[url_column].dropna().unique()

# Maps parameter name -> number of distinct URLs that contain it.
parameters = {}
print(f"Analysing {len(urls)} urls ...")
for url in urls:
    # str() guards against a column that pandas inferred as non-string.
    query_string = urlparse.urlparse(str(url))
    # parse_qs returns a dict keyed by parameter name, so a parameter repeated
    # inside one URL is counted once for that URL. keep_blank_values=True keeps
    # parameters with an empty value (e.g. "?ref=" or "?print"), which parse_qs
    # would otherwise silently drop.
    for param in parse_qs(query_string.query, keep_blank_values=True):
        parameters[param] = parameters.get(param, 0) + 1

# sorted() already yields a list of (parameter, count) tuples; it is stable, so
# parameters with equal counts keep their first-seen order.
parameters = sorted(parameters.items(), key=lambda item: item[1], reverse=True)
print(f"{len(parameters)} unique URL parameters found.")
print(f"Saving output to {output_file}...")
DataFrame(parameters, columns=["Parameter","Count"]).to_csv(output_file, index=False)
Are there any code examples left?
New code examples in category Python
-
Python 2023-04-11 03:04:20
-
Python 2022-03-27 22:40:04 pycharm no module named
-
Python 2022-03-27 22:25:05 assign multiple variables in one line
-
Python 2022-03-27 22:20:02 levenshtein distance
-
Python 2022-03-27 21:35:09 get text from url python last slash
-
Python 2022-03-27 21:30:30 df concatenate df
-
Python 2022-03-27 21:25:09 python odd or even
-
Python 2022-03-27 21:15:32 python include function from another file
-
Python 2022-03-27 21:10:01 color module python
-
Python 2022-03-27 21:00:27 python tkinter cursor types