美文网首页Python三期爬虫作业
【Python爬虫】--第二周_2作业

【Python爬虫】--第二周_2作业

作者: _孙小籽 | 来源:发表于2017-07-28 10:03 被阅读12次

    18

    # Two arguments, packed into *args
    def print_two(*args):
        """Print exactly two positional arguments using their repr().

        The arguments arrive packed in ``args``; the unpacking raises
        ValueError unless exactly two were supplied.
        """
        first, second = args
        message = "arg1: %r, arg2: %r" % (first, second)
        print(message)
    
    # Same output as the *args variant, but with two named parameters
    def print_two_again(arg1, arg2):
        """Print the repr() of both arguments on one line."""
        pair = (arg1, arg2)
        print("arg1: %r, arg2: %r" % pair)
    
    # Single-argument variant
    def print_one(arg1):
        """Print the repr() of a single argument.

        The operand is wrapped in a 1-tuple because ``%`` treats a bare tuple
        as the full argument list: without the wrapper a 2-tuple raises
        TypeError and a 1-tuple is silently unwrapped.
        """
        print("arg1: %r" % (arg1,))
    
    def print_None():
        """Print the bare ``arg1:`` label; takes no arguments."""
        label = "arg1:"
        print(label)
    
    # Call each helper once: two packed arguments, two named arguments,
    # one argument, and finally no arguments.
    print_two("z", 3)
    print_two_again("one", "two")
    print_one("onlyone")
    print_None()
    

    19

    # A function that takes two arguments
    def chesses_and_crackers(chesses_count, boxes_and_crackers):
        """Print a four-line party report for the two given quantities.

        Each value is formatted with ``%r``. The operands are wrapped in
        1-tuples so that a tuple argument is printed as-is instead of being
        taken for the ``%`` argument list (which would raise TypeError).
        """
        print("You have %r chesses" % (chesses_count,))
        print("You have %r boxes and crackers" % (boxes_and_crackers,))
        print("Men, that's enough for a party!")
        # The embedded "\n" plus print's own newline leaves a blank line
        print("Get a blanket. \n")
    
    # Call the function with integer literals as arguments
    print("We can just give the function number directly.")
    chesses_and_crackers(10, 20)
    
    # Assign two variables, then call the function with those variables
    print("Or, we can use variable from our script:")
    amount_of_chesses = 10
    amount_of_crackers = 20
    chesses_and_crackers(amount_of_chesses, amount_of_crackers)
    
    # Call the function with arithmetic expressions as arguments
    print("We can even do math inside too")
    chesses_and_crackers(10+3, 20+7)
    
    # Call the function with variable-plus-constant arithmetic
    print("And we can combine the two, variable and math")
    chesses_and_crackers(amount_of_chesses + 10, 20 + amount_of_crackers)
    
    # Call the function with one variable and one literal
    print("And we can combine the two, variable or math")
    chesses_and_crackers(amount_of_chesses, 20 )
    

    20

    from sys import argv
    
    # argv must hold exactly two items (the script name and one file path);
    # any other count makes this unpacking raise ValueError.
    script, input_file = argv
    
    def print_all(f):
        """Read everything remaining in file object ``f`` and print it."""
        contents = f.read()
        print(contents)
    
    def rewind(f):
        """Move the read position of file object ``f`` back to offset 0."""
        start_of_file = 0
        f.seek(start_of_file)
    
    def print_a_line(line_count, f):
        """Print ``line_count`` followed by the next line read from ``f``.

        The line keeps whatever trailing newline ``readline()`` returns, so
        print's own newline follows it.
        """
        line = f.readline()
        print(line_count, line)
    
    # Open the file in a context manager so the handle is closed once the
    # demo finishes, even if one of the reads below raises.
    with open(input_file) as current_file:
        # Dump the whole file; this leaves the read position at the end
        print_all(current_file)

        print("Now let's rewind, kind of like a tape.")
        rewind(current_file)

        # Each call consumes one line, so the file advances by itself;
        # current_line only supplies the label printed next to it.
        print("Let's print three lines:")
        current_line = 1
        print_a_line(current_line, current_file)
        print_a_line(current_line + 1, current_file)
        print_a_line(current_line + 2, current_file)
    

    21

    def add(a, b):
        """Announce the addition on stdout, then return ``a + b``."""
        announcement = "ADDING %d + %d" % (a, b)
        print(announcement)
        return a + b
    
    def subtract(a, b):
        """Announce the subtraction on stdout, then return ``a - b``."""
        announcement = "SUBTRACTING %d - %d" % (a, b)
        print(announcement)
        return a - b
    
    def multiply(a, b):
        """Announce the multiplication on stdout, then return ``a * b``."""
        announcement = "MULTIPLY %d * %d" % (a, b)
        print(announcement)
        return a * b
    
    def divide(a, b):
        """Announce the division on stdout, then return ``a / b``.

        The announcement is printed before dividing, so it still appears
        when the division itself raises.
        """
        announcement = "DIVIDING %d / %d" % (a, b)
        print(announcement)
        return a / b
    
    print("Let's do some math with just functions!")

    # Each helper prints what it is doing and hands back the result
    age = add(30, 5)
    height = subtract(78, 4)
    weight = multiply(90, 2)
    iq = divide(100, 2)

    print("Age: %d, Height: %d, Weight: %d, IQ: %d" %(age, height, weight, iq))
    print("Here is a puzzle.")
    # Nested calls evaluate inside-out: divide runs first, then multiply,
    # subtract and finally add, each consuming the previous return value.
    what = add(age, subtract(height, multiply(weight, divide(iq, 2))))
    # Message typo fixed: "by hard" -> "by hand"
    print("That becomes:", what, "can you do it by hand?")
    

    23

    import requests
    from lxml import etree
    from datetime import datetime as dt
    # Jianshu article to scrape
    job_url = 'http://www.jianshu.com/p/5ddb3cda7c00'
    # Fetch the page. The timeout keeps a stalled connection from hanging the
    # script, and raise_for_status() stops us from parsing an HTTP error page.
    response = requests.get(job_url, timeout=10)
    response.raise_for_status()
    html = response.content
    # Parse the raw HTML into an lxml element tree
    selector = etree.HTML(html)
    # Output file name template; %s is filled with the creation date
    file_base_name = '作业_%s.txt'
    # Today's date as a YYYY-MM-DD string
    create_time = dt.strftime(dt.now(), '%Y-%m-%d')
    # XPath query (not a regular expression) for the article title
    title_matches = selector.xpath('//div[@class="article"]/h1[@class="title"]/text()')
    if not title_matches:
        # Fail with a readable message instead of a bare IndexError
        raise SystemExit('title not found in ' + job_url)
    title = title_matches[0].strip()
    # XPath query for every text node inside the article body
    content_data = selector.xpath('//div[@class="show-content"]//text()')
    # Baidu cloud download link written into the report
    baidu_href = 'https://pan.baidu.com/s/1eSvg7HS'
    # Collection page where the homework is submitted
    zhuanti_url = 'http://www.jianshu.com/c/1b31f26b6af0'
    # Insert the date string into the file name template
    file_name = file_base_name % create_time
    # Write as UTF-8 explicitly so the Chinese text does not depend on the
    # platform's default encoding; the with-block closes the file for us.
    with open(file_name, 'w', encoding='utf-8') as f:
        # Homework title, followed by a newline
        f.write('【作业标题】' + title)
        f.write('\n')
        # Collection URL
        f.write('python三期爬虫作业交稿专题地址====》:' + zhuanti_url)
        f.write('\n')
        # Fixed notice line
        f.write('本帖持续更新,录制视频资源及时更新在下面百度云下载链接 请及时查看群公告')
        f.write('\n')
        # Baidu cloud address
        f.write('百度云下载链接:' + baidu_href)
        f.write('\n')
        # Skip fragments that start with either prefix; print every other
        # fragment and write it, stripped, on its own line.
        for i in content_data:
            if i.startswith(('百度', '群公告')):
                continue
            print(i)
            f.write(i.strip())
            f.write('\n')
    
    #### 24
    # Escape-sequence demo: \' is a quote, \\ a backslash, \n a newline and
    # \t a tab inside the string literals below.
    print("Let's practice everything.")
    print('You\'d need to know \'bout escapes with \\ that do \n newlines and \t tabs.')
    
    # Triple-quoted string: the line breaks and leading spaces typed here are
    # part of the value, alongside the \n and \t escapes.
    poem = """
    \tThe lovely world
    with logic so firmly planted
    cannot discern \n the needs of love nor comprehend passion from intuition and requires an explanation \n\t\twhere there is none.
    """
    print("_________________")
    print(poem)
    print("_________________")
    
    # 10 - 2 + 3 - 6 evaluates to 5, matching the message below
    five = 10 -2 + 3 - 6
    print("This should be five: %s" % five)
    
    def secret_formula(started):
        """Derive bean, jar and crate quantities from a starting number.

        Returns a 3-tuple ``(beans, jars, crates)`` where beans is
        ``started * 500``, jars is beans divided by 1000 and crates is jars
        divided by 100.
        """
        bean_total = started * 500
        jar_total = bean_total / 1000
        crate_total = jar_total / 100
        return bean_total, jar_total, crate_total
    
    start_point = 10000
    # Unpack the three returned values into separate names
    beans, jars, crates = secret_formula(start_point)
    
    print("With a starting point of: %d" % start_point)
    print("We'd have %d beans, %d jars, and %d crates." % (beans, jars, crates))
    # NOTE: under Python 3 "/" is true division, so start_point is a float
    # from here on; %d still prints it as a whole number.
    start_point = start_point / 10
    
    print("We can also do that this way:")
    # The returned 3-tuple feeds the three %d placeholders directly
    print("We'd have %d beans, %d jars, and %d crates." % secret_formula(start_point))
    

    25

    def break_words(stuff):
        """Split ``stuff`` on single space characters and return the pieces.

        Only ' ' separates words; consecutive spaces therefore produce empty
        strings in the result.
        """
        return stuff.split(' ')
    
    def sort_words(words):
        """Return a new ascending-sorted list; ``words`` is left untouched."""
        ordered = list(words)
        ordered.sort()
        return ordered
    
    def print_first_word(words):
        """Remove the first item from the list ``words`` and print it."""
        first = words.pop(0)
        print(first)
    
    def print_last_word(words):
        """Remove the last item from the list ``words`` and print it."""
        print(words.pop())
    
    def sort_sentence(sentence):
        """Break ``sentence`` into words and return them sorted."""
        return sort_words(break_words(sentence))
    
    def print_first_and_last(sentence):
        """Print the first and then the last word of ``sentence``.

        Both helpers pop from the list they are given. Each one gets its own
        one-item slice, so a single-word sentence prints that word twice
        instead of raising IndexError on the second pop.
        """
        words = break_words(sentence)
        print_first_word(words[:1])
        print_last_word(words[-1:])
    
    def print_first_and_last_sorted(sentence):
        """Sort the words of ``sentence``, then print the first and last one.

        Both helpers pop from the list they are given. Each one gets its own
        one-item slice, so a single-word sentence prints that word twice
        instead of raising IndexError on the second pop.
        """
        words = sort_sentence(sentence)
        print_first_word(words[:1])
        print_last_word(words[-1:])
    
    # Read one sentence from the user, then show its first/last words in
    # sorted order and in the order typed.
    words = input("...>... ")
    print_first_and_last_sorted(words)
    print_first_and_last(words)
    

    26

    def break_words(stuff):
        """Return the pieces of ``stuff`` separated by single spaces.

        Only ' ' is a separator, so tabs stay inside a word and consecutive
        spaces yield empty strings.
        """
        pieces = stuff.split(' ')
        return pieces
    
    def sort_words(words):
        """Return the items of ``words`` as a new list in ascending order."""
        result = list(words)
        result.sort()
        return result
    
    def print_first_word(words):
        """Pop the item at index 0 off the list ``words`` and print it."""
        print(words.pop(0))
    
    def print_last_word(words):
        """Pop the final item off the list ``words`` and print it."""
        tail = words.pop()
        print(tail)
    
    def sort_sentence(sentence):
        """Split ``sentence`` into words and hand back the sorted list."""
        return sort_words(break_words(sentence))
    
    def print_first_and_last(sentence):
        """Print the first and then the last word of ``sentence``.

        Both helpers pop from the list they are given. Each one gets its own
        one-item slice, so a single-word sentence prints that word twice
        instead of raising IndexError on the second pop.
        """
        words = break_words(sentence)
        print_first_word(words[:1])
        print_last_word(words[-1:])
    
    def print_first_and_last_sorted(sentence):
        """Sort the words of ``sentence``, then print the first and last one.

        Both helpers pop from the list they are given. Each one gets its own
        one-item slice, so a single-word sentence prints that word twice
        instead of raising IndexError on the second pop.
        """
        words = sort_sentence(sentence)
        print_first_word(words[:1])
        print_last_word(words[-1:])
    
    
    # Escape-sequence demo: \' is a quote, \\ a backslash, \n a newline and
    # \t a tab inside the string literals below.
    print("Let's practice everything.")
    print('You\'d need to know \'bout escapes with \\ that do \n newlines and \t tabs.')

    # Triple-quoted string: the line breaks and leading spaces typed here are
    # part of the value. Typo fixed: "explantion" -> "explanation".
    poem = """
    \tThe lovely world
    with logic so firmly planted
    cannot discern \n the needs of love
    nor comprehend passion from intuition
    and requires an explanation
    \n\t\twhere there is none.
    """


    print("--------------")
    print(poem)
    print("--------------")

    # Was "10 - 2 + 3 - 5", which is 6 and contradicted the message below
    five = 10 - 2 + 3 - 6
    print("This should be five: %s" % five)
    
    def secret_formula(started):
        """Compute bean, jar and crate quantities from ``started``.

        Returns ``(beans, jars, crates)``: beans is ``started * 500``, jars is
        beans divided by 1000, and crates is jars divided by 100.
        """
        beans = started * 500
        jar_count = beans / 1000
        crate_count = jar_count / 100
        return beans, jar_count, crate_count
    
    
    start_point = 10000
    # Unpack the three returned values into separate names
    jelly_beans, jars, crates = secret_formula(start_point)

    print("With a starting point of: %d" % start_point)
    # Label fixed: the first value is beans, not "jeans"
    print("We'd have %d beans, %d jars, and %d crates." % (jelly_beans, jars, crates))

    # Under Python 3 "/" is true division, so start_point is a float from
    # here on; %d still prints it as a whole number.
    start_point = start_point / 10

    print("We can also do that this way:")
    # Label fixed: the third value is crates, not "crabapples"
    print("We'd have %d beans, %d jars, and %d crates." % secret_formula(start_point))


    # Sentence repaired: it previously read "god\tthings ... weight.", which
    # put a tab inside a word that break_words cannot split on.
    sentence = "All good things come to those who wait."

    words = break_words(sentence)
    sorted_words = sort_words(words)

    # The print helpers pop from the list they receive, so both lists
    # shrink by two items over the next four calls.
    print_first_word(words)
    print_last_word(words)
    print_first_word(sorted_words)
    print_last_word(sorted_words)
    sorted_words = sort_sentence(sentence)
    print(sorted_words)

    print_first_and_last(sentence)

    print_first_and_last_sorted(sentence)
    
    

    相关文章

      网友评论

        本文标题:【Python爬虫】--第二周_2作业

        本文链接:https://www.haomeiwen.com/subject/xejxlxtx.html