afunTW
diff --git a/‎Session_A/answer/02_regular_expression_answer.ipynb‎
Lines changed: 4 additions & 3 deletions b/‎Session_A/answer/02_regular_expression_answer.ipynb‎
Lines changed: 4 additions & 3 deletions
diff --git a/‎Session_A/answer/02_regular_expression_answer.py‎
Lines changed: 48 additions & 20 deletions b/‎Session_A/answer/02_regular_expression_answer.py‎
Lines changed: 48 additions & 20 deletions
diff --git a/‎Session_A/practice/01_BeautifulSoup_functions.ipynb‎
Lines changed: 3 additions & 4 deletions b/‎Session_A/practice/01_BeautifulSoup_functions.ipynb‎
Lines changed: 3 additions & 4 deletions
diff --git a/‎Session_A/practice/02_regular_expression.ipynb‎
Lines changed: 4 additions & 3 deletions b/‎Session_A/practice/02_regular_expression.ipynb‎
Lines changed: 4 additions & 3 deletions
@@ -479,7 +479,7 @@
    "source": [
     "# 如果忘記怎麼寫 requests 或 BeautifulSoup，可以參考\n",
     "\n",
-    "# response = requests.get(\"http://yp.518.com.tw/service-life.html?ctf=10\")\n",
+    "# response = requests.get(\"https://jimmy15923.github.io/518\")\n",
     "# print(response.encoding)\n",
     "\n",
     "# soup = BeautifulSoup(response.text, \"lxml\")"
@@ -494,7 +494,7 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "UTF-8\n",
+      "utf-8\n",
       "['02-29242789', '03-4709933', '04-23601719', '06-2092929', '05-2238686', '07-6994433', '07-3610768', '02-29662939', '02-29662939', '02-29609370']\n"
      ]
     }
@@ -505,7 +505,8 @@
     "from bs4 import BeautifulSoup\n",
     "import re\n",
     "\n",
-    "response = requests.get(\"http://yp.518.com.tw/service-life.html?ctf=10\") # requests 518 網頁 並拿到 response\n",
+    "## 518 網頁伺服器無法容納多人同時 requests，請大家使用以下的網頁作 requests，其 html 的內容是一模一樣的\n",
+    "response = requests.get(\"https://jimmy15923.github.io/518\") # requests 518 網頁 並拿到 response\n",
     "print(response.encoding) # 印出 encoding 結果\n",
     "soup = BeautifulSoup(response.text, \"lxml\")  # 將 HTML 丟給 BeautifulSoup 作解析\n",
     "\n",
 
@@ -25,7 +25,9 @@
 # ### 範例 02-1:  *, +, {} 的用法
 # \* 代表前面的字元可出現零次以上，而 + 則是代表前面的字元至少要出現一次，{m,n} 則是代表前面的字元可出現 m 次 ~ n 次
 
-# In[24]:
+# In[1]:
+
+import re
 
 pattern = "a+b*c"
 test_string = 'find aabc, ac, skip abb, dd'
@@ -37,7 +39,9 @@
 # 
 # Hint: 思考一下要尋找的文字跟要濾除的文字，在字母之間有甚麼差異，先把 find 寫出來，再想辦法去掉要 skip 
 
-# In[20]:
+# In[2]:
+
+import re
 
 ### your codes
 pattern = "a*b+c"
@@ -48,7 +52,9 @@
 # ### 範例 02-2: 找到英數字
 # 中括號代表的意思是「這個字元可以是括號內的任何一個」，以數字為例，[0-9]代表這個字元可以是 0~9 之間的任意數字，如果是 [a-z] 則代表是小寫字母 a~z 之間的任意文字，聰明的你，應該可以猜出 [A-Z] 代表的是甚麼意思吧?
 
-# In[26]:
+# In[3]:
+
+import re
 
 pattern = "[0-9]+"
 test_string = '12 drummers drumming, 11 pipers piping, 10 lords a-leaping'
@@ -58,7 +64,9 @@
 # ### 練習 02-2: 找到英數字
 # 在 test_string 中找出所有數字
 
-# In[21]:
+# In[4]:
+
+import re
 
 # your codes
 pattern = "[1-3]+"
@@ -69,14 +77,18 @@
 # ### 範例 02-3: 找到文字
 # 當有指定的文字需要搜尋，可透過 [ ] 搭配 *, + ,{} 進行搜尋
 
-# In[28]:
+# In[5]:
+
+import re
 
 pattern = "[cmf]an"
 test_string = 'find: can, man, fan, skip: dan, ran, pan'
 re.findall(pattern, test_string)
 
 
-# In[29]:
+# In[6]:
+
+import re
 
 pattern = "jim{2,5}y"
 test_string = 'find: jimmy, jimmmy, jimmmmmy, skip: jimy'
@@ -88,7 +100,9 @@
 # 
 # Hint: 如果只找到一個大寫字母，想想甚麼符號代表可出現一次以上?
 
-# In[22]:
+# In[7]:
+
+import re
 
 # your codes
 pattern = "[A-Z]+[a-z]"
@@ -103,7 +117,9 @@
 # 
 # 這時在 "+" 前面加上 "\" (跳脫符號)，這樣做的話 regular expression 就會知道你是要尋找 "+" 
 
-# In[31]:
+# In[8]:
+
+import re
 
 pattern = ".{3}\."
 test_string = 'find: 591., dot., yes., skip: non!'
@@ -113,7 +129,9 @@
 # ### 練習 02-4: 跳脫符號
 # 在 test_string 中找到 A+c, B+d, C+x
 
-# In[23]:
+# In[9]:
+
+import re
 
 # your codes
 pattern = "[A-Z]\+[a-z]"
@@ -124,7 +142,9 @@
 # ### 範例 02-5: 條件式搜尋
 # 當希望不同的搜尋條件都能夠符合時，可以使用「|」這個符號，代表左右邊只要任何一個條件符合，就會回傳
 
-# In[33]:
+# In[10]:
+
+import re
 
 pattern = "I love cats|I love dogs"
 test_string = 'find: I love cats, I love dogs, skip: I love logs, I love cogs'
@@ -134,7 +154,9 @@
 # ### 練習 02-5: 條件式搜尋
 # 在 test_string 中找到 jimy, jimmmy, 但不包含 jimmy, jimmmmy
 
-# In[24]:
+# In[11]:
+
+import re
 
 # your codes
 pattern = "jimy|jim{3}y"
@@ -144,7 +166,9 @@
 
 # ###  範例 02-6: Email 搜尋
 
-# In[35]:
+# In[12]:
+
+import re
 
 email_text = """
 Big Data Analytics/ Deep LearningSocial Computing / Computational Social Science / Crowdsourcing
@@ -159,7 +183,9 @@
 """
 
 
-# In[36]:
+# In[13]:
+
+import re
 
 re.findall("([A-Za-z0-9._]+@[A-Za-z.]+(com|edu)\.tw)", email_text)
 
@@ -174,33 +200,35 @@
 # * text = " ".join(text_list)，這段 code 可以將 list of string 全部變為一個字串
 # * 變成字串後就可以用剛剛學的 re.findall() 找出我們要的目標囉!
 
-# In[37]:
+# In[14]:
 
 # 如果忘記怎麼寫 requests 或 BeautifulSoup，可以參考
 
-# response = requests.get("http://yp.518.com.tw/service-life.html?ctf=10")
+# response = requests.get("https://jimmy15923.github.io/518")
 # print(response.encoding)
 
 # soup = BeautifulSoup(response.text, "lxml")
 
 
-# In[2]:
+# In[15]:
 
 # your codes
 import requests
 from bs4 import BeautifulSoup
+import re
 
-response = requests.get("http://yp.518.com.tw/service-life.html?ctf=10") # requests 518 網頁 並拿到 response
+## 518 網頁伺服器無法容納多人同時 requests，請大家使用以下的網頁作 requests，其 html 的內容是一模一樣的
+response = requests.get("https://jimmy15923.github.io/518") # requests 518 網頁 並拿到 response
 print(response.encoding) # 印出 encoding 結果
 soup = BeautifulSoup(response.text, "lxml")  # 將 HTML 丟給 BeautifulSoup 作解析
 
-
-# In[ ]:
-
+# 找到電話資訊都藏在 li 標籤，屬性 class=comp_tel
 all_phone_text = [tag.text for tag in soup.find_all("li",class_="comp_tel")]
 
+# 把電話資訊的 list 存成一個大 string
 all_phone_text ="".join(all_phone_text)
 
+# 用 regular expression 把全部的電話都找出來
 phone_number = re.findall("0[1-9]+-[0-9]+", all_phone_text)
 print(phone_number)
 
@@ -226,11 +226,10 @@
     "\n",
     "# 2. 發送 requests.get，並將結果存在 response (或自己定義喜歡的變數也可以)\n",
     "# your codes\n",
-    "response = \n",
+    "\n",
     "\n",
     "# 3. 將 response 的 HTML 文字放進 BeautifulSoup，並將結果存在 soup (或自己定義喜歡的變數也可以)\n",
-    "# your codes\n",
-    "soup = "
+    "# your codes\n"
    ]
   },
   {
@@ -276,7 +275,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "Q3. 請找出**列3欄3**背後的超連結網址? (請使用 BeautifulSoup + 右鍵→檢查 來找到那個標籤，不要偷偷從網頁點開連結來看喔^^)"
+    "Q3. 請找出**列3欄3**背後的超連結網址? (請使用右鍵→檢查 來找到列3欄3的標籤，不要偷偷從網頁點開連結來看喔^^)"
    ]
   },
   {
 
@@ -5,7 +5,7 @@
    "metadata": {},
    "source": [
     "## 範例 02: regular expression\n",
-    "regular expression 是在搜尋大量文字時非常好用的工具，可以快速回傳符合您要求的文字\n",
+    "regular expression 是在大量文字中搜尋目標資訊時非常好用的工具，可以快速回傳符合您要求的文字\n",
     "\n",
     "例如尋找任何像是電話號碼、E-mail 信箱的文字\n",
     "\n",
@@ -75,7 +75,7 @@
     "### 練習 02-1: *, +, {} 的用法\n",
     "在 test_string 中找出 abbbbc, bc，但不包含 c, acc\n",
     "\n",
-    "Hint: 思考一下要尋找的文字跟要濾除的文字，在字母之間有甚麼差異，先把 find 寫出來，再想辦法去掉要 skip "
+    "Hint: 思考一下要尋找的文字跟要濾除的文字，在字母之間有甚麼差異"
    ]
   },
   {
@@ -432,7 +432,8 @@
    "source": [
     "# 如果忘記怎麼寫 requests 或 BeautifulSoup，可以參考\n",
     "\n",
-    "# response = requests.get(\"http://yp.518.com.tw/service-life.html?ctf=10\")\n",
+    "## 518 網頁伺服器無法容納多人同時 requests，請大家使用以下的網頁作 requests，其 html 的內容是一模一樣的\n",
+    "# response = requests.get(\"https://jimmy15923.github.io/518\")\n",
     "# print(response.encoding)\n",
     "\n",
     "# soup = BeautifulSoup(response.text, \"lxml\")"
Original file line number	Diff line number	Diff line change
`@@ -226,11 +226,10 @@`
`226`	`226`	`"\n",`
`227`	`227`	`"# 2. 發送 requests.get，並將結果存在 response (或自己定義喜歡的變數也可以)\n",`
`228`	`228`	`"# your codes\n",`
`229`		`- "response = \n",`
	`229`	`+ "\n",`
`230`	`230`	`"\n",`
`231`	`231`	`"# 3. 將 response 的 HTML 文字放進 BeautifulSoup，並將結果存在 soup (或自己定義喜歡的變數也可以)\n",`
`232`		`- "# your codes\n",`
`233`		`- "soup = "`
	`232`	`+ "# your codes\n"`
`234`	`233`	`]`
`235`	`234`	`},`
`236`	`235`	`{`
`@@ -276,7 +275,7 @@`
`276`	`275`	`"cell_type": "markdown",`
`277`	`276`	`"metadata": {},`
`278`	`277`	`"source": [`
`279`		`- "Q3. 請找出列3欄3背後的超連結網址? (請使用 BeautifulSoup + 右鍵→檢查來找到那個標籤，不要偷偷從網頁點開連結來看喔^^)"`
	`278`	`+ "Q3. 請找出列3欄3背後的超連結網址? (請使用右鍵→檢查來找到列3欄3的標籤，不要偷偷從網頁點開連結來看喔^^)"`
`280`	`279`	`]`
`281`	`280`	`},`
`282`	`281`	`{`