2016-03-21 11 views
0
import lxml 
from lxml import html 
import requests 
import re 
import csv 
with open('job.csv', 'wb') as csvfile: 
    a=csv.writer(csvfile) 
    a.writerow(["title","employer","salary","location"]) 
    for i in range(1): 
     url = "http://www.jobs-salary.com/salaries.php?q=illumina&ml=25&lc=&state=&company=&title=&sb=relevance&ps={}".format(i) 
     page = requests.get(url) 
     # print page.text 
     tree = html.fromstring(page.content) 
     for item in tree.xpath('//table[@class="resTb"]'): 

     # print tree.xpath('//table[@class="resTb"]//td/b/a/text()') 
     info = {} 
     info['title']=item.xpath('.//td/b/a/text()') 
     h = info['title'] 
     print h 

出力は、XPath pythonで縦に出力を私は取得しています

['Scientist I', 'Scientist', 'Scientist', 'Scientist', 'Biochemist', 'Scientist I', 'Biochemist', 'Scientist I', 'Scientist I', 'Biomedical Engineer', 'Biochemist', 'Fluidics Engineer', 'Biochemist And Biophysicists', 'Scientist I', 'Scientist I', 'Scientist', 'Scientist', 'Scientist I', 'Scientist I', 'Scientist II']

される印刷しかし、私は は誰が助けることができていない括弧やカンマで垂直にしたいですか?

答えて

1

リストを改行(\ n)で区切られた文字列として出力するだけです。 、

Scientist I 
Scientist 
Scientist 
Scientist 
Biochemist 
Scientist I 
Biochemist 
Scientist I 
Scientist I 
Biomedical Engineer 
Biochemist 
Fluidics Engineer 
Biochemist And Biophysicists 
Scientist I 
Scientist I 
Scientist 
Scientist 
Scientist I 
Scientist I 
Scientist II 
0

代わりのテーブルをitearting各行(table内部tr)を繰り返す:

h = ['Scientist I', 'Scientist', 'Scientist', 'Scientist', 'Biochemist', 'Scientist I', 'Biochemist', 'Scientist I', 'Scientist I', 'Biomedical Engineer', 'Biochemist', 'Fluidics Engineer', 'Biochemist And Biophysicists', 'Scientist I', 'Scientist I', 'Scientist', 'Scientist', 'Scientist I', 'Scientist I', 'Scientist II'] 
print('\n'.join(h)) 

出力を:あなたはあなたのリスト hjoinを呼び出すことによってこれを行うことができます。そして tdがそこにあるのを見つけてください。

from lxml import html 
import requests 
import csv 

url = "http://www.jobs-salary.com/salaries.php?q=illumina&ml=25&relevance&ps={}" 
with open('job.csv', 'wb') as csvfile: 
    a = csv.writer(csvfile) 
    a.writerow(["title", "employer", "salary", "location"]) 
    for i in range(1): 
     page = requests.get(url.format(i)) 
     tree = html.fromstring(page.content) 
     for item in tree.xpath('//table[@class="resTb"]/tr')[1:]: 
      row = [ 
       item.xpath('.//td[1]')[0].text_content(), # title 
       item.xpath('.//td[2]')[0].text_content(), # employer 
       item.xpath('.//td[3]')[0].text_content(), # salary 
       item.xpath('.//td[4]')[0].text_content(), # location 
      ] 
      print row 
      a.writerow(row) 
関連する問題