# %% Single sample draw: 0 = boy (p = 0.51), 1 = girl (p = 0.49).
import random
import numpy as np
result = np.random.choice([0, 1], p=[0.51, 0.49])
result


# %%
def get_girl_prob(n, children=3, p_girl=0.49):
    """Estimate by simulation the chance that a family has at least one girl.

    Each of ``n`` simulated families has ``children`` independent births, and
    every birth is a girl with probability ``p_girl``.  A family counts as a
    success when at least one of its births is a girl.  (Stopping at the first
    girl, as a birth-by-birth loop would, yields the same success
    probability, so all births are drawn at once instead.)

    Args:
        n: Number of families to simulate; must be a positive integer.
        children: Maximum number of births per family (default 3).
        p_girl: Probability that a single birth is a girl (default 0.49).

    Returns:
        The fraction of simulated families with at least one girl, as a
        Python ``float`` in ``[0.0, 1.0]``.  For the defaults this converges
        to ``1 - 0.51 ** 3`` (about 0.867).

    Raises:
        ValueError: If ``n`` is not positive, ``children`` is negative, or
            ``p_girl`` lies outside ``[0, 1]``.
    """
    # Local import so this cell still works when it is run on its own.
    import numpy as np

    if n <= 0:
        raise ValueError("n must be a positive number of families")
    if children < 0:
        raise ValueError("children must be non-negative")
    if not 0.0 <= p_girl <= 1.0:
        raise ValueError("p_girl must be a probability between 0 and 1")

    # One uniform draw per (family, birth); a draw below p_girl is a girl.
    is_girl = np.random.random((n, children)) < p_girl
    # any(axis=1): did this family get at least one girl?  mean(): share of
    # such families.  float() keeps the return type a plain Python float.
    return float(is_girl.any(axis=1).mean())


# %%
get_girl_prob(100000)
-0,0 +1,3276 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [], + "source": [ + "from bs4 import BeautifulSoup\n", + "import requests" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 驚奇4超人 The Fantastic Four - Yahoo奇摩電影\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
\n", + "
\n", + "
\n", + " \n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + " \n", + " \n", + "
\n", + " \n", + "
\n", + "
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + " \n", + "
\n", + "
\n", + " 追蹤我們\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + " \n", + "
\n", + " \n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
\n", + "
\n", + "
\n", + " \n", + " \n", + "
\n", + "
\n", + " \n", + " 選擇\n", + "
\n", + " 片名\n", + "
\n", + " \n", + " \n", + " 選擇\n", + "
\n", + " 地區\n", + "
\n", + " \n", + "
\n", + " 查詢\n", + "
\n", + "
\n", + "
\n", + " \n", + "
\n", + "
\n", + " \n", + " 選擇\n", + "
\n", + " 分類\n", + "
\n", + " \n", + " \n", + " 選擇\n", + "
\n", + " 頻道\n", + "
\n", + " \n", + "
\n", + " 查詢\n", + "
\n", + "
\n", + "
\n", + " \n", + "
\n", + " 查詢\n", + "
\n", + "
\n", + "
\n", + " \n", + "
\n", + "
\n", + " \n", + " 選擇\n", + "
\n", + " 戲院\n", + "
\n", + " \n", + " \n", + " 選擇\n", + "
\n", + " 片名\n", + "
\n", + " \n", + " \n", + " 選擇\n", + "
\n", + " 日期\n", + "
\n", + " \n", + " \n", + " 選擇\n", + "
\n", + " 場次\n", + "
\n", + " \n", + " \n", + " 選擇\n", + "
\n", + " 數量\n", + "
\n", + " \n", + "
\n", + " 查詢\n", + "
\n", + "
\n", + "
\n", + " \n", + "
\n", + "
\n", + " \n", + "
\n", + "
\n", + "
\n", + " 查詢\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
\n", + "
\n", + " \n", + " 電影排行榜\n", + " \n", + "
\n", + "
\n", + "
    \n", + "
  • \n", + " 台北票房榜\n", + "
  • \n", + "
  • \n", + " 全美票房榜\n", + "
  • \n", + "
  • \n", + " 預告片榜\n", + "
  • \n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + " \n", + " \"\"\n", + " \n", + "
\n", + "
\n", + " \n", + " 潛艦獵殺令\n", + " \n", + " \n", + "

\n", + " ★《#玩命關頭》《#全面攻佔》金牌團隊聯手打造\n", + "

\n", + "

\n", + " ★鐵漢男星《氣象戰》#傑瑞德巴特勒 X 金獎影帝 #蓋瑞歐德曼\n", + "

\n", + "

\n", + " ★史詩級 #磅礡潛艦海戰,超震撼 #大型艦對艦battle\n", + "

\n", + "

\n", + " ★繼《#獵殺U571》後再創全新經典潛艇電影\n", + "

\n", + "

\n", + " ★改編自唐凱思及喬治華萊士創作小說《#砲擊點》\n", + "

\n", + "

\n", + "

\n", + "

\n", + " 在北極海的海底深處,美國潛艦艦長喬葛拉斯(傑瑞德巴特勒 飾)在搜尋一艘落難的美國潛艇時,意外發現俄國即將發生一場軍事政變,眼看就要瓦解世界的秩序。葛拉斯艦長要保護艦上人員的安危,更要捍衛國土,他現在必須集結一支海軍精英特種部隊,前往搭救被綁架的俄國總統,並潛入敵軍的海域阻止第三次世界大戰的爆發。\n", + "

\n", + "

\n", + "

\n", + "

\n", + " 本片雲集重量級演員卡司,陣容包含蘇格蘭鐵漢男星《氣象戰》傑瑞德巴特勒、奧斯卡金獎影帝《最黑暗的時刻》蓋瑞歐德曼、《捍衛任務2:殺神回歸》凡夫俗子、《復仇者聯盟2:奧創紀元》琳達卡迪林尼、以及《007:誰與爭鋒》托比史第文斯,是一部緊張刺激的驚悚片,橫跨海陸場景,台美即將同步上映。\n", + "

\n", + "

\n", + "

\n", + "
\n", + "
\n", + "
\n", + " \n", + "
\n", + " 統計時間 : 2018-11-03~2018-11-04\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + " \n", + " \"\"\n", + " \n", + "
\n", + "
\n", + " \n", + " 波希米亞狂想曲\n", + " \n", + " \n", + "

\n", + " ★搖滾不死!皇后合唱團傳記電影首登大銀幕 神曲百分百催淚再詮釋\n", + "
\n", + " ★《波希米亞狂想曲》傳奇主唱佛萊迪墨裘瑞 華麗奇幻一生感動上映\n", + "
\n", + " ★他們是你偶像的偶像 史上最暢銷搖滾樂團之一 影響世界樂壇近半世紀\n", + "
\n", + "
\n", + " 《波希米亞狂想曲》以搖滾經典的不敗傳奇「皇后合唱團」為中心環繞;描述他們的音樂以及其樂團的靈魂人物──主唱佛萊迪墨裘瑞(雷米馬利克飾)短暫卻刻骨銘心的一生,如何靠著音樂打破世俗常規,奠定了搖滾樂的基石,成為地球史上最偉大的藝術家之一。\n", + "
\n", + "
\n", + " 電影透過他們極具原創性與獨樹一格的標誌曲風,和墨裘瑞充滿爆發性且穿透力的歌聲,描述了皇后合唱團的崛起,以及其一路如何成功風靡了全球樂迷的心;然而,在外界看不到的背後,這個看速堅固的經典傳奇卻藏匿著一觸即發的潛在衝突,就如同於墨裘瑞的生活方式一般,快速地被捲入漩渦且即將失去控制。\n", + "
\n", + "
\n", + " 但即便是在被病魔纏身的狀況之下,墨裘瑞依然乘載著樂迷們的期待,引領著樂團一同於Live Aid的舞台上,成功締造了本世紀最偉大的表演舞台。皇后合唱團華麗且迷幻的心路歷程,不只是鞏固著隊友之間親如家人的情感,以及再次顯示了他們對音樂的執著及血脈傳承。即便到今日,他們的精神也都能夠持續地透過經典,感染並激勵著地球上的每一個角落,包括所有的夢想家及樂迷們。\n", + "

\n", + "
\n", + "
\n", + "
\n", + " \n", + "
\n", + " 統計時間 : 2018-11-02~2018-11-04\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + " \n", + " \"\"\n", + " \n", + "
\n", + "
\n", + " \n", + " 怪獸與葛林戴華德的罪行\n", + " \n", + " \n", + "

\n", + " 華納兄弟影業再度推出JK羅琳魔法世界全新冒險五部曲中的第二部大作:《怪獸與葛林戴華德的罪行》。\n", + "

\n", + "

\n", + "

\n", + "

\n", + " 在第一部電影的尾聲,美國魔法國會在紐特斯卡曼德(艾迪瑞德曼 飾 )的協助下,成功緝捕強大的黑巫師蓋勒葛林戴華德(強尼戴普 飾)到案。但不久後葛林戴華德驗證了先前放話的威脅,成功逃離大牢並開始廣收信眾,這些人大多不知他背後的真實目標:培養一群純種巫師大軍,好統御所有莫魔生靈。\n", + "

\n", + "

\n", + "

\n", + "

\n", + " 為了阻撓葛林戴華德的計畫,阿不思鄧不利多(裘德洛 飾)招攬他往日的學生紐特斯卡曼德來幫忙,紐特也欣然接下任務,但卻對前方重重的阻礙及危險渾然不知。此行揭開了派系的鬥爭及分野,愛情及忠誠度受到嚴峻考驗,就連最親近的朋友及家人也面臨測試,魔法世界的嫌隙及鴻溝日益擴大。\n", + "

\n", + "

\n", + "

\n", + "

\n", + " 本片眾星雲集的卡司由:艾迪瑞德曼、凱薩琳華特斯頓、丹富樂、艾莉森蘇朵、伊薩米勒,以及裘德洛與強尼戴普等人領銜主演。其他卡司班底包括:柔伊克拉維茲、卡倫透納、金秀賢、威廉奈迪蘭、凱文格斯里、卡門艾喬格,以及帕琵柯比圖奇。\n", + "

\n", + "

\n", + "

\n", + "

\n", + " 《怪獸與葛林戴華德的罪行》由大衛葉慈執導,劇本由JK羅琳親自操刀。本片由大衛海曼、JK羅琳、史提夫克羅夫斯,以及萊恩諾維格蘭出任製片。\n", + "

\n", + "

\n", + "

\n", + "

\n", + " 本片預計於2018年11月16日上映,並由華納兄弟娛樂公司旗下的華納兄弟影業負責全球發行,以2D及3D形式播放,並在特定戲院以IMAX形式上映。\n", + "

\n", + "
\n", + "
\n", + "
\n", + " \n", + "
\n", + " 統計時間 : 2018-11-10\n", + "
\n", + "
\n", + "
\n", + " \n", + " \n", + " \n", + "
\n", + "
\n", + "
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
\n", + "
\n", + " \n", + "
\n", + "
\n", + " \n", + " 你最近瀏覽的電影\n", + " \n", + "
\n", + "
\n", + "
    \n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + " \n", + "
\n", + " \n", + " \"\"\n", + " \n", + " \n", + " \"\"\n", + " \n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + " \"\"\n", + "
\n", + " \n", + "
\n", + "
\n", + "
\n", + "
\n", + "

\n", + " 驚奇4超人\n", + "

\n", + "

\n", + " The Fantastic Four\n", + "

\n", + "
\n", + "
\n", + " \n", + " 動作\n", + " \n", + "
\n", + "
\n", + " \n", + " 科幻\n", + " \n", + "
\n", + "
\n", + " \n", + " 上映日期:2015-08-06\n", + " \n", + " \n", + " 片  長:01時40分\n", + " \n", + " \n", + " 發行公司:福斯影業\n", + " \n", + " \n", + " IMDb分數:4.3\n", + " \n", + " \n", + " 導演:\n", + " \n", + "
\n", + " 喬許傳克\n", + "
\n", + " \n", + " 演員:\n", + " \n", + " \n", + " \n", + " 官方連結:\n", + " \n", + " \n", + " https://www.facebook.com/foxmovies.tw\n", + " \n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + " 期待度\n", + "
\n", + "
\n", + "
\n", + "

\n", + " 電影已上映,不開放投票\n", + "

\n", + " \n", + " (共183人投票)\n", + " \n", + "
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
\n", + "
\n", + " \n", + " 80\n", + " \n", + " %\n", + "
\n", + " 想看\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + " 滿意度\n", + "
\n", + "
\n", + "
\n", + "

\n", + " 請給這部電影評分:\n", + "

\n", + "

\n", + " 尚未開放網友評分\n", + "

\n", + "
\n", + "
\n", + " \n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + " \n", + " \n", + "
\n", + "
\n", + "
\n", + " \n", + " (共366人投票)\n", + " \n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + " 2.3\n", + "
\n", + " 總評分\n", + "
\n", + "
\n", + " \n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + " \n", + " \n", + " \n", + "
\n", + "
\n", + " \n", + " 最新預告片\n", + " \n", + "
\n", + "
\n", + "
\n", + " 共14支\n", + "
\n", + "
\n", + "
\n", + " \n", + "
\n", + "
\n", + " \n", + "
\n", + "
\n", + " \n", + " 精彩劇照\n", + " \n", + "
\n", + "
\n", + "
\n", + " 共15張\n", + "
\n", + "
\n", + " \n", + "
\n", + " \n", + "
\n", + "
\n", + " \n", + " 劇情介紹\n", + " \n", + "
\n", + "
\n", + "
\n", + "
\n", + " \n", + " ★ 重新啟動 全新陣容再掀熱潮 今年暑假超級強片首選!\n", + "
\n", + " ★ 漫威英雄系列漫畫超經典創始作 最歷久不衰之暢銷漫畫 全球熱銷超過45億台幣\n", + "
\n", + " ★ 《X戰警》系列王牌編劇、製作 親自操刀編劇\n", + "
\n", + "
\n", + " 福斯影片重金打造全新《驚奇4超人》英雄漫畫鉅作再度搬上大銀幕,改編自漫威漫畫(Marvel)的超人氣經典,描述四位原本生活平凡的年輕人,被傳送至一個處處充滿危機的宇宙時空,從此四人的外貌身形都起了巨大的變化。而這些無法逆轉的身體變化也促使「驚奇4超人」,重新適應學習,並善用他們的超能力,同時併肩合作以抵禦外侮,保護即將遭敵軍破壞殆盡的地球家園,但他們所要對抗的竟是昔日摯友…\n", + "
\n", + "
\n", + " 詳全文\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + " \n", + " 展開劇情簡介\n", + " \n", + "
\n", + "
\n", + "
\n", + " \n", + "
\n", + "
\n", + " \n", + " 相關文章\n", + " \n", + "
\n", + " 共3則\n", + "
\n", + "
\n", + "
\n", + " \n", + " \n", + "
\n", + "
\n", + " \n", + "
\n", + "
\n", + " \n", + " 網友短評\n", + " \n", + "
\n", + " 共129則\n", + "
\n", + "
\n", + "
\n", + "
\n", + "
\n", + " 排序:\n", + " \n", + " \n", + "
\n", + "
\n", + "
    \n", + "
  • \n", + "
    \n", + "
    \n", + " \n", + "
    \n", + "

    \n", + " 網友評分:\n", + "

    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
    \n", + "
    \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
    \n", + "
    \n", + " \n", + " \n", + " 回應評論\n", + "
    \n", + " \n", + " 檢舉\n", + " \n", + "
    \n", + " \n", + " 看完感覺真的沒什麼劇情,但是至少還有特效...\n", + " \n", + "
    \n", + " 發表人:張阿策\n", + "
    \n", + "
    \n", + " 發表時間:2016-08-14 21:58:53\n", + "
    \n", + "
    \n", + " 顯示回應(0)\n", + "
    \n", + "
    \n", + "
    \n", + " 顯示更多內容\n", + "
    \n", + "
    \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
    \n", + "
    \n", + "
  • \n", + "
  • \n", + "
    \n", + "
    \n", + " \n", + "
    \n", + "

    \n", + " 網友評分:\n", + "

    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
    \n", + "
    \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
    \n", + "
    \n", + " \n", + " \n", + " 回應評論\n", + "
    \n", + " \n", + " 檢舉\n", + " \n", + "
    \n", + " \n", + " 还抄襲前幾年一樣的作品,,,真難看,也很幼稚,,敗拖可別學別人出第2集\n", + " \n", + "
    \n", + " 發表人:man\n", + "
    \n", + "
    \n", + " 發表時間:2016-07-31 13:07:07\n", + "
    \n", + "
    \n", + " 顯示回應(0)\n", + "
    \n", + "
    \n", + "
    \n", + " 顯示更多內容\n", + "
    \n", + "
    \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
    \n", + "
    \n", + "
  • \n", + "
  • \n", + "
    \n", + "
    \n", + " \n", + "
    \n", + "

    \n", + " 網友評分:\n", + "

    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + "
    \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
    \n", + "
    \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
    \n", + "
    \n", + " \n", + " \n", + " 回應評論\n", + "
    \n", + " \n", + " 檢舉\n", + " \n", + "
    \n", + " \n", + " Wasted my money and time\n", + " \n", + "
    \n", + " 發表人:Shpqe1雅虎測試\n", + "
    \n", + "
    \n", + " 發表時間:2016-07-25 18:35:32\n", + "
    \n", + "
    \n", + " 顯示回應(0)\n", + "
    \n", + "
    \n", + "
    \n", + " 顯示更多內容\n", + "
    \n", + "
    \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
    \n", + "
    \n", + "
  • \n", + "
\n", + " \n", + "
\n", + "
\n", + " \n", + "
\n", + "
\n", + "
\n", + " \n", + "
\n", + " \n", + "
    \n", + "
  • \n", + " \n", + " 與本電影無關、捏造假冒、不實敘述\n", + "
  • \n", + "
  • \n", + " \n", + " 具有廣告性質或大量重複散布\n", + "
  • \n", + "
  • \n", + " \n", + " 相互惡意攻訐、猥褻騷擾、人身攻擊\n", + "
  • \n", + "
  • \n", + " \n", + " 侵犯隱私權、違反智慧財產權、涉及違法情事\n", + "
  • \n", + "
  • \n", + " \n", + " 違背善良風俗\n", + "
  • \n", + "
\n", + "
\n", + " 確認送出\n", + "
\n", + "
\n", + " \"\"\n", + "
\n", + " \n", + "
\n", + " \n", + "
\n", + "
\n", + "
\n", + " \n", + " \n", + "
\n", + "
\n", + "
\n", + "
\n", + " \n", + "
# %% Download the Yahoo Movies detail page and parse it.
# Without a timeout, requests can wait indefinitely on a stalled connection;
# without raise_for_status(), an HTTP error page would be parsed as if it were
# the movie page and every lookup below would fail with an opaque
# AttributeError on None.
response = requests.get('https://movies.yahoo.com.tw/movieinfo_main.html/id=5644', timeout=30)
response.raise_for_status()
source = response.text
soup = BeautifulSoup(source, 'lxml')
print(soup.prettify())

# %% Combined title from the <title> tag with the site suffix removed.
# The replace() leaves blanks where the suffix was, so strip them.
title = soup.find('title').text.replace('- Yahoo奇摩電影',' ').strip()
print(title)

# %% Chinese title: the <h1> inside the movie info panel.
info_box = soup.find('div', class_='movie_intro_info_r')
title_cn = info_box.h1.text
print(title_cn)

# %% English title: the <h3> inside the same panel.
title_en = info_box.h3.text
print(title_en)

# %% First <span> of the panel (the release-date line).
date = info_box.span.text
print(date)

# %% Genre names: text of every a.gabtn inside a div.level_name.
genre = []
for level_box in soup.find_all('div', class_='level_name'):
    for genre_link in level_box.find_all('a', class_='gabtn'):
        genre.append(genre_link.text.replace('\n', " ").strip())
genre

# %% Release date, running time and distributor.
# The panel's <span> elements come in page order: release date (上映日期),
# running time (片長), distributor (發行公司).  The earlier version assigned
# index 0 to `length` and index 1 to `date`, which put the running time in the
# Date column and the release date in the Length column downstream.
movie_info = [
    span.text
    for panel in soup.find_all('div', class_='movie_intro_info_r')
    for span in panel.find_all('span')
]
date = movie_info[0]
length = movie_info[1]
company = movie_info[2]
print(date, length, company)

# %% Director and cast.
# NOTE(review): assumes the first div.movie_intro_list holds the director and
# the following one(s) hold the actor links, as the page dump for this movie
# shows (導演 block first, 演員 block second) -- confirm on other movie pages.
# The earlier check `len(cast.text) == 4` only matched a director whose name
# was exactly four characters with no surrounding whitespace, and otherwise
# left `director` undefined.
intro_lists = soup.find_all('div', class_='movie_intro_list')
# split()/join collapses the newlines and padding around the name.
director = ' '.join(intro_lists[0].text.split()) if intro_lists else ''
cast_list = []
for people_box in intro_lists[1:]:
    for actor in people_box.find_all('a'):
        cast_list.append(actor.text)
print(cast_list)
print(director)

# %% Official website.
# The first a.gabtn in the panel is a genre button, so taking it yields a
# genre-listing URL instead of the movie's site.  Locate the "官方連結" label
# and take the link that follows it.
# NOTE(review): assumes the official URL is the first <a> after that label;
# verify against the page markup.
website = None
for panel in soup.find_all('div', class_='movie_intro_info_r'):
    link_label = panel.find(string=lambda s: s is not None and '官方連結' in s)
    if link_label is None:
        continue
    link = link_label.find_next('a')
    if link is not None and link.has_attr('href'):
        website = link['href']
    print(website)
# %% Plot summary: first <span> inside the grey info box.
# strip() rather than lstrip(): the span text also ends with a newline and
# padding, which otherwise ends up in the exported data.
summary = soup.find('div',class_='gray_infobox_inner').span.text.strip()
print(summary)

# %% Export the scraped record to CSV.
import csv
# - `with` closes the file even if a write fails.
# - newline='' is what the csv module expects, so it can control line endings
#   itself (avoids blank rows on Windows).
# - An explicit UTF-8 encoding is needed because the fields contain Chinese
#   text and the platform default encoding may not be able to represent it.
with open('webscrap_yahoo.csv', 'w', newline='', encoding='utf-8') as csv_file:
    csv_writer = csv.writer(csv_file)
    csv_writer.writerow(['Title_EN','Date','Genre','Length','Director','Cast','Production','Website','Plot'])
    # One value per header column, in header order.  Previously only the
    # Chinese title was written, landing under the 'Title_EN' header.
    # Genre and cast are lists, so they are flattened to readable strings.
    csv_writer.writerow([
        title_en,
        date,
        ', '.join(genre),
        length,
        director,
        ', '.join(cast_list),
        company,
        website,
        summary,
    ])

# %% The same record as a one-row DataFrame (each value wrapped in a list so
# that list-valued fields such as genre and cast stay in a single cell).
my_dict = {'Title':[title],'Date':[date],'Genre':[genre],'Length':[length], 'Company': [company], 'Director':[director], 'Cast':[cast_list],
          'Website':[website],'Summary':[summary]}
import pandas as pd
df = pd.DataFrame(my_dict)
df