Bringing in URL for host extraction

This commit is contained in:
windlejacob12 2022-09-03 23:27:04 -04:00
parent 0bdf6ac5ea
commit e414debf33

View File

@ -1,14 +1,19 @@
(ns com-jakewindle-git.scraper
(:require [clj-http.client :as client]
[hickory.core :as hick]
[hickory.select :as s]))
[hickory.select :as s])
(:import (java.net URL)))
;; Models
;; Earlier definition of the seed URL list, holding only the ESPN NFL team-stats page.
;; NOTE(review): this appears to be the pre-change side of the diff hunk; the
;; `stat-urls` def that immediately follows rebinds the var with an extra URL.
(def stat-urls ["https://www.espn.com/nfl/stats/team/_/season/2011/seasontype/2"])
(def stat-urls
  "Seed page URLs for the crawler; `init-crawler` hands each entry to `new-page`."
  ["https://www.espn.com/nfl/stats/team/_/season/2011/seasontype/2"
   "https://stats.premierlacrosseleague.com/games/2022/whipsnakes-chaos-2022-6-04"])
(defn not-nil
  "Return true when `v` is anything other than nil (including false), false when it is nil."
  [v]
  ;; `some?` is the core predicate defined as (not (nil? x)).
  (some? v))
(defn get-host
  "Return the host component of `url`.

  `url` is a string containing an absolute URL, e.g.
  \"https://www.espn.com/nfl/stats\" yields \"www.espn.com\". Sub-domains are
  kept as part of the host.

  Throws java.net.MalformedURLException when `url` cannot be parsed
  (for example when it has no protocol)."
  [url]
  ;; java.net.URL has no zero-argument constructor, so the URL string must be
  ;; handed to it; the previous `(new URL)` ignored `url` and could not compile.
  (.getHost (URL. url)))
(defn new-page [uri]
(-> uri
(client/get)
@ -26,6 +31,13 @@
(defn init-crawler
  "Apply `new-page` to every URL in `stat-urls` and return the resulting sequence.

  The sequence comes from `map` and is therefore lazy: `new-page` is not
  invoked for an entry until that element is realized."
  []
  (map new-page stat-urls))
(defn parse-pll
  "PLL parser function.

  Placeholder: currently ignores `parsed` and returns nil."
  [parsed]
  ;; The docstring has to precede the parameter vector; placed after it, the
  ;; string was just the body expression, so the var carried no :doc metadata
  ;; and the function returned the string itself.
  ;; TODO: implement the actual parsing of `parsed`.
  nil)
(def parse-funcs
  "Lookup table pairing a site identifier string with the function that parses that site."
  ;; NOTE(review): the key is the bare domain, while the PLL entry in
  ;; `stat-urls` has host \"stats.premierlacrosseleague.com\"; if lookups use the
  ;; full host reported by java.net.URL they will miss this key -- confirm.
  {"premierlacrosseleague.com" parse-pll})
;; Entities
(defn greet
"Callable entry point to the application."