Init commit

2026-06-27 18:44:23 +08:00 · 2019-07-18 17:37:40 -04:00
commit 6d711ba63b
5 changed files with 188 additions and 0 deletions
@@ -0,0 +1,44 @@
+import requests
+import re
+import csv
+import lxml
+from bs4 import BeautifulSoup
+
+sec_url = 'https://www.sec.gov'
+
+def get_request(url):
+    return requests.get(url)
+
+def create_url(cik):
+    return 'https://www.sec.gov/cgi-bin/browse-edgar?CIK={}&owner=exclude&action=getcompany&type=13F-HR'.format(cik)
+
+def get_user_input():
+    cik = input("Enter 10-digit CIK number: ")
+    return cik
+
+requested_cik = get_user_input()
+
+# Find mutual fund by CIK number on EDGAR
+response = get_request(create_url(requested_cik))
+soup = BeautifulSoup(response.text, "html.parser")
+tags = soup.findAll('a', id="documentsbutton")
+
+# Find latest 13F report for mutual fund
+response_two = get_request(sec_url + tags[0]['href'])
+soup_two = BeautifulSoup(response_two.text, "html.parser")
+tags_two = soup_two.findAll('a', attrs={'href': re.compile('xml')})
+xml_url = tags_two[3].get('href')
+
+response_xml = get_request(sec_url + xml_url)
+soup_xml = BeautifulSoup(response_xml.content, "lxml")
+
+# Find all issuers
+issuers = soup_xml.body.findAll(re.compile('nameofissuer'))
+for issuer in issuers:
+    print(issuer.text)
+
+# Write issuer names to TSV file
+with open('{}.tsv'.format(requested_cik), 'wt') as out_file:
+    tsv_writer = csv.writer(out_file, delimiter='\t')
+    for issuer in issuers:
+        tsv_writer.writerow([issuer.text])