From 7360ffa3c90a1057d7eeb2b030977d95119b4e39 Mon Sep 17 00:00:00 2001 From: Ibrahim Serdar Acikgoz Date: Fri, 14 Jun 2019 14:57:53 +0300 Subject: [PATCH] Update README.md --- README.md | 34 +++++++++++++++++----------------- 1 file changed, 17 insertions(+), 17 deletions(-) diff --git a/README.md b/README.md index 3e8b777..3cea48b 100644 --- a/README.md +++ b/README.md @@ -1,5 +1,5 @@ # Geziyor -Geziyor is a blazing fast web crawling and web scraping framework, used to crawl websites and extract structured data from their pages. It can be used for a wide range of purposes, from data mining to monitoring and automated testing. +Geziyor is a blazing fast web crawling and web scraping framework. It can be used to crawl websites and extract structured data from them. Geziyor is useful for a wide range of purposes such as data mining, monitoring and automated testing. [![GoDoc](https://godoc.org/github.com/geziyor/geziyor?status.svg)](https://godoc.org/github.com/geziyor/geziyor) [![report card](https://goreportcard.com/badge/github.com/geziyor/geziyor)](http://goreportcard.com/report/geziyor/geziyor) @@ -16,7 +16,7 @@ Geziyor is a blazing fast web crawling and web scraping framework, used to crawl See scraper [Options](https://godoc.org/github.com/geziyor/geziyor#Options) for all custom settings. ## Status -We highly recommend you to use go modules. As this project is in **development stage** right now and **API is not stable**. +Since the project is in the **development phase**, the **API may change over time**. We also highly recommend using Geziyor with Go modules. 
## Usage Simple usage @@ -34,27 +34,27 @@ Advanced usage ```go func main() { - geziyor.NewGeziyor(geziyor.Options{ - StartURLs: []string{"http://quotes.toscrape.com/"}, - ParseFunc: quotesParse, - Exporters: []geziyor.Exporter{exporter.JSONExporter{}}, - }).Start() + geziyor.NewGeziyor(geziyor.Options{ + StartURLs: []string{"http://quotes.toscrape.com/"}, + ParseFunc: quotesParse, + Exporters: []geziyor.Exporter{exporter.JSONExporter{}}, + }).Start() } func quotesParse(r *geziyor.Response) { - r.DocHTML.Find("div.quote").Each(func(i int, s *goquery.Selection) { - r.Exports <- map[string]interface{}{ - "text": s.Find("span.text").Text(), - "author": s.Find("small.author").Text(), - } - }) - if href, ok := r.DocHTML.Find("li.next > a").Attr("href"); ok { - go r.Geziyor.Get(r.JoinURL(href), quotesParse) - } + r.DocHTML.Find("div.quote").Each(func(i int, s *goquery.Selection) { + r.Exports <- map[string]interface{}{ + "text": s.Find("span.text").Text(), + "author": s.Find("small.author").Text(), + } + }) + if href, ok := r.DocHTML.Find("li.next > a").Attr("href"); ok { + go r.Geziyor.Get(r.JoinURL(href), quotesParse) + } } ``` -See [tests](https://github.com/geziyor/geziyor/blob/master/geziyor_test.go) for more usage examples +See [tests](https://github.com/geziyor/geziyor/blob/master/geziyor_test.go) for more usage examples. ## Installation