Skip to content

Commit

Permalink
Optimized
Browse files Browse the repository at this point in the history
  • Loading branch information
Sakthe-Balan committed Apr 7, 2024
1 parent e75ec7c commit 5b36fa7
Show file tree
Hide file tree
Showing 6 changed files with 6 additions and 79 deletions.
File renamed without changes.
41 changes: 0 additions & 41 deletions server/chunk.py

This file was deleted.

12 changes: 6 additions & 6 deletions server/dino/dino/spiders/spider2.py
Original file line number Diff line number Diff line change
@@ -1730,9 +1730,9 @@ def parse_software_page(self, response):
print(software_sections,"ss")
for section in software_sections:
software_info = {
- 'name': section.css('a.d-flex.align-items-center.ga_track_soft_name::text').get(),
- 'rating': section.css('span.star_new_background::text').get(),
- 'logo_href': section.css('img.soft_logo.ls-is-cached.lazyloaded::attr(src)').get(),
+ 'title': section.css('a.d-flex.align-items-center.ga_track_soft_name::text').get(),
+ 'price': section.css('span.star_new_background::text').get(),
+ 'image_url': section.css('img.soft_logo.ls-is-cached.lazyloaded::attr(src)').get(),
'profile_href': section.css('a.ga_track_soft_profile.view_profile_inline::attr(href)').get(),
'website':section.css('a.ga_track_vwl_vwb.ripple_btn.cat_vwbft_fdfcgp_btn.vwb_btn.d-flex.align-items-center.justify-content-center::attr(href)')[0].get()
}
@@ -1747,12 +1747,12 @@ def parse_software_page(self, response):
def parse_software_profile(self, response):
software_info = response.meta['software_info']
# Extract the overview
- software_info['logo_href']=response.xpath('//img[not(@class)]')[2].attrib.get('src', None)
- software_info['overview'] = response.css('p.read_more_text_overview::text').get()
+ software_info['image_url']=response.xpath('//img[not(@class)]')[2].attrib.get('src', None)
+ software_info['description'] = response.css('p.read_more_text_overview::text').get()

# Extract the overall review

- software_info['main_review_headings'] = response.xpath("//h3[@class='main_review_heading_main'][position() <= 3]/text()").getall()
+ software_info['reviews'] = response.xpath("//h3[@class='main_review_heading_main'][position() <= 3]/text()").getall()

print(software_info)

Expand Down
25 changes: 0 additions & 25 deletions server/outputs.json

This file was deleted.

Empty file removed server/scrapers.txt
Empty file.
7 changes: 0 additions & 7 deletions server/test.py

This file was deleted.

0 comments on commit 5b36fa7

Please sign in to comment.