forked from ukamnya/microdata_mirror
		
	Made Microdata and Item fields public
This commit is contained in:
		
							parent
							
								
									da8a656b05
								
							
						
					
					
						commit
						ffada1099e
					
				
							
								
								
									
										33
									
								
								README.md
									
									
									
									
									
								
							
							
						
						
									
										33
									
								
								README.md
									
									
									
									
									
								
							| @ -1 +1,34 @@ | |||||||
| microdata - a microdata parser in Go | microdata - a microdata parser in Go | ||||||
|  | 
 | ||||||
|  | INSTALLATION | ||||||
|  | ============ | ||||||
|  | 
 | ||||||
|  | Simply run | ||||||
|  | 
 | ||||||
|  | 	go get github.com/iand/microdata | ||||||
|  | 
 | ||||||
|  | Documentation is at [http://go.pkgdoc.org/github.com/iand/microdata](http://go.pkgdoc.org/github.com/iand/microdata) | ||||||
|  | 
 | ||||||
|  | 
 | ||||||
|  | USAGE | ||||||
|  | ===== | ||||||
|  | 
 | ||||||
|  | Example of parsing a string containing HTML: | ||||||
|  | 
 | ||||||
|  | 	import ( | ||||||
|  | 		"net/url" | ||||||
|  | 		"strings" | ||||||
|  | 	) | ||||||
|  | 	html = `<div itemscope> | ||||||
|  | 	 <p>My name is <span itemprop="name">Elizabeth</span>.</p> | ||||||
|  | 	</div>` | ||||||
|  | 
 | ||||||
|  | 	baseUrl, _ := url.Parse("http://example.com/") | ||||||
|  | 	p := NewParser(strings.NewReader(html), baseUrl) | ||||||
|  | 
 | ||||||
|  | 	data, err := p.Parse() | ||||||
|  | 	if err != nil { | ||||||
|  | 		t.Errorf("Expected no error but got %v", err) | ||||||
|  | 	} | ||||||
|  | 
 | ||||||
|  | 	println("Name: ", data.Items[0].Properties["name"][0])
							
								
								
									
										42
									
								
								microdata.go
									
									
									
									
									
								
							
							
						
						
									
										42
									
								
								microdata.go
									
									
									
									
									
								
							| @ -12,47 +12,49 @@ type ValueList []interface{} | |||||||
| type PropertyMap map[string]ValueList | type PropertyMap map[string]ValueList | ||||||
| 
 | 
 | ||||||
| type Item struct { | type Item struct { | ||||||
| 	properties PropertyMap | 	Properties PropertyMap | ||||||
| 	types      []string | 	Types      []string | ||||||
| 	id         string | 	ID         string | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| func NewItem() *Item { | func NewItem() *Item { | ||||||
| 	return &Item{ | 	return &Item{ | ||||||
| 		properties: make(PropertyMap, 0), | 		Properties: make(PropertyMap, 0), | ||||||
| 		types:      make([]string, 0), | 		Types:      make([]string, 0), | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| func (self *Item) SetString(property string, value string) { | func (self *Item) SetString(property string, value string) { | ||||||
| 	self.properties[property] = append(self.properties[property], value) | 	self.Properties[property] = append(self.Properties[property], value) | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| func (self *Item) SetItem(property string, value *Item) { | func (self *Item) SetItem(property string, value *Item) { | ||||||
| 	self.properties[property] = append(self.properties[property], value) | 	self.Properties[property] = append(self.Properties[property], value) | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| 
 | 
 | ||||||
| type Microdata struct { | type Microdata struct { | ||||||
| 	items []*Item | 	Items []*Item | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| func NewMicrodata() *Microdata { | func NewMicrodata() *Microdata { | ||||||
| 	return &Microdata{ | 	return &Microdata{ | ||||||
| 		items: make([]*Item, 0), | 		Items: make([]*Item, 0), | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| type Parser struct { | type Parser struct { | ||||||
| 	p               *h5.Parser | 	p               *h5.Parser | ||||||
| 	data            *Microdata | 	data            *Microdata | ||||||
|  | 	base 			*url.URL | ||||||
| 	identifiedNodes map[string]*h5.Node | 	identifiedNodes map[string]*h5.Node | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| func NewParser(r io.Reader, url.URL) *Parser { | func NewParser(r io.Reader, base *url.URL) *Parser { | ||||||
| 	return &Parser{ | 	return &Parser{ | ||||||
| 		p:    h5.NewParser(r), | 		p:    h5.NewParser(r), | ||||||
| 		data: NewMicrodata(), | 		data: NewMicrodata(), | ||||||
|  | 		base: base, | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| @ -80,17 +82,19 @@ func (self *Parser) Parse() (*Microdata, error) { | |||||||
| 
 | 
 | ||||||
| 	for _, node := range topLevelItemNodes { | 	for _, node := range topLevelItemNodes { | ||||||
| 		item := NewItem() | 		item := NewItem() | ||||||
| 		self.data.items = append(self.data.items, item) | 		self.data.Items = append(self.data.Items, item) | ||||||
| 		if itemtypes, exists := getAttr("itemtype", node); exists { | 		if itemtypes, exists := getAttr("itemtype", node); exists { | ||||||
| 			for _, itemtype := range strings.Split(strings.TrimSpace(itemtypes), " ") { | 			for _, itemtype := range strings.Split(strings.TrimSpace(itemtypes), " ") { | ||||||
| 				itemtype = strings.TrimSpace(itemtype) | 				itemtype = strings.TrimSpace(itemtype) | ||||||
| 				if itemtype != "" { | 				if itemtype != "" { | ||||||
| 					item.types = append(item.types, itemtype) | 					item.Types = append(item.Types, itemtype) | ||||||
| 				} | 				} | ||||||
| 			} | 			} | ||||||
| 			// itemid only valid when itemscope and itemtype are both present | 			// itemid only valid when itemscope and itemtype are both present | ||||||
| 			if itemid, exists := getAttr("itemid", node); exists { | 			if itemid, exists := getAttr("itemid", node); exists { | ||||||
| 				item.id = strings.TrimSpace(itemid) | 				if parsedUrl, err := self.base.Parse(itemid); err == nil { | ||||||
|  | 					item.ID = parsedUrl.String() | ||||||
|  | 				} | ||||||
| 			} | 			} | ||||||
| 
 | 
 | ||||||
| 		} | 		} | ||||||
| @ -152,11 +156,16 @@ func (self *Parser) readItem(item *Item, node *h5.Node) { | |||||||
| 
 | 
 | ||||||
| 			case "img", "audio", "source", "video", "embed", "iframe", "track": | 			case "img", "audio", "source", "video", "embed", "iframe", "track": | ||||||
| 				if urlValue, exists := getAttr("src", node); exists { | 				if urlValue, exists := getAttr("src", node); exists { | ||||||
| 					propertyValue = urlValue | 					if parsedUrl, err := self.base.Parse(urlValue); err == nil { | ||||||
|  | 						propertyValue = parsedUrl.String() | ||||||
|  | 					} | ||||||
|  | 
 | ||||||
| 				} | 				} | ||||||
| 			case "a", "area", "link": | 			case "a", "area", "link": | ||||||
| 				if urlValue, exists := getAttr("href", node); exists { | 				if urlValue, exists := getAttr("href", node); exists { | ||||||
| 					propertyValue = urlValue | 					if parsedUrl, err := self.base.Parse(urlValue); err == nil { | ||||||
|  | 						propertyValue = parsedUrl.String() | ||||||
|  | 					} | ||||||
| 				} | 				} | ||||||
| 			case "data": | 			case "data": | ||||||
| 				if urlValue, exists := getAttr("value", node); exists { | 				if urlValue, exists := getAttr("value", node); exists { | ||||||
| @ -178,13 +187,14 @@ func (self *Parser) readItem(item *Item, node *h5.Node) { | |||||||
| 				propertyValue = text.String() | 				propertyValue = text.String() | ||||||
| 			} | 			} | ||||||
| 
 | 
 | ||||||
|  | 			if len(propertyValue) > 0 { | ||||||
| 				for _, propertyName := range strings.Split(strings.TrimSpace(itemprop), " ") { | 				for _, propertyName := range strings.Split(strings.TrimSpace(itemprop), " ") { | ||||||
| 					propertyName = strings.TrimSpace(propertyName) | 					propertyName = strings.TrimSpace(propertyName) | ||||||
| 					if propertyName != "" { | 					if propertyName != "" { | ||||||
| 						item.SetString(propertyName, propertyValue) | 						item.SetString(propertyName, propertyValue) | ||||||
| 					} | 					} | ||||||
| 				} | 				} | ||||||
| 
 | 			} | ||||||
| 
 | 
 | ||||||
| 		} | 		} | ||||||
| 
 | 
 | ||||||
|  | |||||||
| @ -1,12 +1,14 @@ | |||||||
| package microdata | package microdata | ||||||
| 
 | 
 | ||||||
| import ( | import ( | ||||||
|  | 	"net/url" | ||||||
| 	"strings" | 	"strings" | ||||||
| 	"testing" | 	"testing" | ||||||
| ) | ) | ||||||
| 
 | 
 | ||||||
| func ParseData(html string, t *testing.T) *Microdata { | func ParseData(html string, t *testing.T) *Microdata { | ||||||
| 	p := NewParser(strings.NewReader(html), url.URL("http://example.com/") | 	u, _ := url.Parse("http://example.com/") | ||||||
|  | 	p := NewParser(strings.NewReader(html), u) | ||||||
| 
 | 
 | ||||||
| 	data, err := p.Parse() | 	data, err := p.Parse() | ||||||
| 	if err != nil { | 	if err != nil { | ||||||
| @ -22,7 +24,7 @@ func ParseData(html string, t *testing.T) *Microdata { | |||||||
| 
 | 
 | ||||||
| func ParseOneItem(html string, t *testing.T) *Item { | func ParseOneItem(html string, t *testing.T) *Item { | ||||||
| 	data := ParseData(html, t) | 	data := ParseData(html, t) | ||||||
| 	return data.items[0] | 	return data.Items[0] | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| func TestParse(t *testing.T) { | func TestParse(t *testing.T) { | ||||||
| @ -33,7 +35,7 @@ func TestParse(t *testing.T) { | |||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 
 | 
 | ||||||
| 	if item.properties["name"][0].(string) != "Elizabeth" { | 	if item.Properties["name"][0].(string) != "Elizabeth" { | ||||||
| 		t.Errorf("Property value not found") | 		t.Errorf("Property value not found") | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| @ -46,7 +48,7 @@ func TestParseActuallyParses(t *testing.T) { | |||||||
| 	</div>` | 	</div>` | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 
 | 
 | ||||||
| 	if item.properties["name"][0].(string) != "Daniel" { | 	if item.Properties["name"][0].(string) != "Daniel" { | ||||||
| 		t.Errorf("Property value not found") | 		t.Errorf("Property value not found") | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| @ -62,15 +64,15 @@ func TestParseThreeProps(t *testing.T) { | |||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 
 | 
 | ||||||
| 	if item.properties["name"][0].(string) != "Neil" { | 	if item.Properties["name"][0].(string) != "Neil" { | ||||||
| 		t.Errorf("Property value not found") | 		t.Errorf("Property value not found") | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 	if item.properties["band"][0].(string) != "Four Parts Water" { | 	if item.Properties["band"][0].(string) != "Four Parts Water" { | ||||||
| 		t.Errorf("Property value not found") | 		t.Errorf("Property value not found") | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 	if item.properties["nationality"][0].(string) != "British" { | 	if item.Properties["nationality"][0].(string) != "British" { | ||||||
| 		t.Errorf("Property value not found") | 		t.Errorf("Property value not found") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| @ -78,12 +80,12 @@ func TestParseThreeProps(t *testing.T) { | |||||||
| func TestParseImgSrc(t *testing.T) { | func TestParseImgSrc(t *testing.T) { | ||||||
| 	html := ` | 	html := ` | ||||||
| 	<div itemscope> | 	<div itemscope> | ||||||
| 	 <img itemprop="image" src="google-logo.png" alt="Google"> | 	 <img itemprop="image" src="http://example.com/foo" alt="Google"> | ||||||
| 	</div>` | 	</div>` | ||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 
 | 
 | ||||||
| 	if item.properties["image"][0].(string) != "google-logo.png" { | 	if item.Properties["image"][0].(string) != "http://example.com/foo" { | ||||||
| 		t.Errorf("Property value not found") | 		t.Errorf("Property value not found") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| @ -91,12 +93,12 @@ func TestParseImgSrc(t *testing.T) { | |||||||
| func TestParseAHref(t *testing.T) { | func TestParseAHref(t *testing.T) { | ||||||
| 	html := ` | 	html := ` | ||||||
| 	<div itemscope> | 	<div itemscope> | ||||||
| 	 <a itemprop="image" href="google-logo.png">foo</a> | 	 <a itemprop="image" href="http://example.com/foo">foo</a> | ||||||
| 	</div>` | 	</div>` | ||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 
 | 
 | ||||||
| 	if item.properties["image"][0].(string) != "google-logo.png" { | 	if item.Properties["image"][0].(string) != "http://example.com/foo" { | ||||||
| 		t.Errorf("Property value not found") | 		t.Errorf("Property value not found") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| @ -104,13 +106,13 @@ func TestParseAHref(t *testing.T) { | |||||||
| func TestParseAreaHref(t *testing.T) { | func TestParseAreaHref(t *testing.T) { | ||||||
| 	html := ` | 	html := ` | ||||||
| 	<div itemscope><map name="shapes"> | 	<div itemscope><map name="shapes"> | ||||||
| 	 <area itemprop="foo" href="target.html" shape=rect coords="50,50,100,100"> | 	 <area itemprop="foo" href="http://example.com/foo" shape=rect coords="50,50,100,100"> | ||||||
| 	 | 	 | ||||||
| 	</map></div>` | 	</map></div>` | ||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 
 | 
 | ||||||
| 	if item.properties["foo"][0].(string) != "target.html" { | 	if item.Properties["foo"][0].(string) != "http://example.com/foo" { | ||||||
| 		t.Errorf("Property value not found") | 		t.Errorf("Property value not found") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| @ -118,12 +120,12 @@ func TestParseAreaHref(t *testing.T) { | |||||||
| func TestParseLinkHref(t *testing.T) { | func TestParseLinkHref(t *testing.T) { | ||||||
| 	html := ` | 	html := ` | ||||||
| 	<div itemscope> | 	<div itemscope> | ||||||
| 		<link itemprop="foo" rel="author" href="target.html"> | 		<link itemprop="foo" rel="author" href="http://example.com/foo"> | ||||||
| 	</div>` | 	</div>` | ||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 
 | 
 | ||||||
| 	if item.properties["foo"][0].(string) != "target.html" { | 	if item.Properties["foo"][0].(string) != "http://example.com/foo" { | ||||||
| 		t.Errorf("Property value not found") | 		t.Errorf("Property value not found") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| @ -131,12 +133,12 @@ func TestParseLinkHref(t *testing.T) { | |||||||
| func TestParseAudioSrc(t *testing.T) { | func TestParseAudioSrc(t *testing.T) { | ||||||
| 	html := ` | 	html := ` | ||||||
| 	<div itemscope> | 	<div itemscope> | ||||||
| 	 <audio itemprop="foo" src="target"></audio> | 	 <audio itemprop="foo" src="http://example.com/foo"></audio> | ||||||
| 	</div>` | 	</div>` | ||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 
 | 
 | ||||||
| 	if item.properties["foo"][0].(string) != "target" { | 	if item.Properties["foo"][0].(string) != "http://example.com/foo" { | ||||||
| 		t.Errorf("Property value not found") | 		t.Errorf("Property value not found") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| @ -144,12 +146,12 @@ func TestParseAudioSrc(t *testing.T) { | |||||||
| func TestParseSourceSrc(t *testing.T) { | func TestParseSourceSrc(t *testing.T) { | ||||||
| 	html := ` | 	html := ` | ||||||
| 	<div itemscope> | 	<div itemscope> | ||||||
| 	 <source itemprop="foo" src="target"></source> | 	 <source itemprop="foo" src="http://example.com/foo"></source> | ||||||
| 	</div>` | 	</div>` | ||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 
 | 
 | ||||||
| 	if item.properties["foo"][0].(string) != "target" { | 	if item.Properties["foo"][0].(string) != "http://example.com/foo" { | ||||||
| 		t.Errorf("Property value not found") | 		t.Errorf("Property value not found") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| @ -157,12 +159,12 @@ func TestParseSourceSrc(t *testing.T) { | |||||||
| func TestParseVideoSrc(t *testing.T) { | func TestParseVideoSrc(t *testing.T) { | ||||||
| 	html := ` | 	html := ` | ||||||
| 	<div itemscope> | 	<div itemscope> | ||||||
| 	 <video itemprop="foo" src="target"></video> | 	 <video itemprop="foo" src="http://example.com/foo"></video> | ||||||
| 	</div>` | 	</div>` | ||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 
 | 
 | ||||||
| 	if item.properties["foo"][0].(string) != "target" { | 	if item.Properties["foo"][0].(string) != "http://example.com/foo" { | ||||||
| 		t.Errorf("Property value not found") | 		t.Errorf("Property value not found") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| @ -170,12 +172,12 @@ func TestParseVideoSrc(t *testing.T) { | |||||||
| func TestParseEmbedSrc(t *testing.T) { | func TestParseEmbedSrc(t *testing.T) { | ||||||
| 	html := ` | 	html := ` | ||||||
| 	<div itemscope> | 	<div itemscope> | ||||||
| 	 <embed itemprop="foo" src="target"></embed> | 	 <embed itemprop="foo" src="http://example.com/foo"></embed> | ||||||
| 	</div>` | 	</div>` | ||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 
 | 
 | ||||||
| 	if item.properties["foo"][0].(string) != "target" { | 	if item.Properties["foo"][0].(string) != "http://example.com/foo" { | ||||||
| 		t.Errorf("Property value not found") | 		t.Errorf("Property value not found") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| @ -183,12 +185,12 @@ func TestParseEmbedSrc(t *testing.T) { | |||||||
| func TestParseTrackSrc(t *testing.T) { | func TestParseTrackSrc(t *testing.T) { | ||||||
| 	html := ` | 	html := ` | ||||||
| 	<div itemscope> | 	<div itemscope> | ||||||
| 	 <track itemprop="foo" src="target"></track> | 	 <track itemprop="foo" src="http://example.com/foo"></track> | ||||||
| 	</div>` | 	</div>` | ||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 
 | 
 | ||||||
| 	if item.properties["foo"][0].(string) != "target" { | 	if item.Properties["foo"][0].(string) != "http://example.com/foo" { | ||||||
| 		t.Errorf("Property value not found") | 		t.Errorf("Property value not found") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| @ -196,12 +198,12 @@ func TestParseTrackSrc(t *testing.T) { | |||||||
| func TestParseIFrameSrc(t *testing.T) { | func TestParseIFrameSrc(t *testing.T) { | ||||||
| 	html := ` | 	html := ` | ||||||
| 	<div itemscope> | 	<div itemscope> | ||||||
| 	 <iframe itemprop="foo" src="target"></iframe> | 	 <iframe itemprop="foo" src="http://example.com/foo"></iframe> | ||||||
| 	</div>` | 	</div>` | ||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 
 | 
 | ||||||
| 	if item.properties["foo"][0].(string) != "target" { | 	if item.Properties["foo"][0].(string) != "http://example.com/foo" { | ||||||
| 		t.Errorf("Property value not found") | 		t.Errorf("Property value not found") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| @ -214,7 +216,7 @@ func TestParseDataValue(t *testing.T) { | |||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 
 | 
 | ||||||
| 	if item.properties["product-id"][0].(string) != "9678AOU879" { | 	if item.Properties["product-id"][0].(string) != "9678AOU879" { | ||||||
| 		t.Errorf("Property value not found") | 		t.Errorf("Property value not found") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| @ -227,7 +229,7 @@ func TestParseTimeDatetime(t *testing.T) { | |||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 
 | 
 | ||||||
| 	if item.properties["birthday"][0].(string) != "2009-05-10" { | 	if item.Properties["birthday"][0].(string) != "2009-05-10" { | ||||||
| 		t.Errorf("Property value not found") | 		t.Errorf("Property value not found") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| @ -243,13 +245,13 @@ func TestParseTwoValues(t *testing.T) { | |||||||
| 	</div>` | 	</div>` | ||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 	if len(item.properties["flavor"]) != 2 { | 	if len(item.Properties["flavor"]) != 2 { | ||||||
| 		t.Errorf("Expecting 2 values but got %d", len(item.properties["flavor"])) | 		t.Errorf("Expecting 2 values but got %d", len(item.Properties["flavor"])) | ||||||
| 	} | 	} | ||||||
| 	if item.properties["flavor"][0].(string) != "Lemon sorbet" { | 	if item.Properties["flavor"][0].(string) != "Lemon sorbet" { | ||||||
| 		t.Errorf("Property value 'Lemon sorbet' not found") | 		t.Errorf("Property value 'Lemon sorbet' not found") | ||||||
| 	} | 	} | ||||||
| 	if item.properties["flavor"][1].(string) != "Apricot sorbet" { | 	if item.Properties["flavor"][1].(string) != "Apricot sorbet" { | ||||||
| 		t.Errorf("Property value 'Apricot sorbet' not found") | 		t.Errorf("Property value 'Apricot sorbet' not found") | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| @ -262,19 +264,19 @@ func TestParseTwoPropertiesOneValue(t *testing.T) { | |||||||
| 	</div>` | 	</div>` | ||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 	if len(item.properties) != 2 { | 	if len(item.Properties) != 2 { | ||||||
| 		t.Errorf("Expecting 2 properties but got %d", len(item.properties)) | 		t.Errorf("Expecting 2 properties but got %d", len(item.Properties)) | ||||||
| 	} | 	} | ||||||
| 	if len(item.properties["favorite-color"]) != 1 { | 	if len(item.Properties["favorite-color"]) != 1 { | ||||||
| 		t.Errorf("Expecting 1 value but got %d", len(item.properties["favorite-color"])) | 		t.Errorf("Expecting 1 value but got %d", len(item.Properties["favorite-color"])) | ||||||
| 	} | 	} | ||||||
| 	if len(item.properties["favorite-fruit"]) != 1 { | 	if len(item.Properties["favorite-fruit"]) != 1 { | ||||||
| 		t.Errorf("Expecting 1 value but got %d", len(item.properties["favorite-fruit"])) | 		t.Errorf("Expecting 1 value but got %d", len(item.Properties["favorite-fruit"])) | ||||||
| 	} | 	} | ||||||
| 	if item.properties["favorite-color"][0].(string) != "orange" { | 	if item.Properties["favorite-color"][0].(string) != "orange" { | ||||||
| 		t.Errorf("Property value 'orange' not found for 'favorite-color'") | 		t.Errorf("Property value 'orange' not found for 'favorite-color'") | ||||||
| 	} | 	} | ||||||
| 	if item.properties["favorite-fruit"][0].(string) != "orange" { | 	if item.Properties["favorite-fruit"][0].(string) != "orange" { | ||||||
| 		t.Errorf("Property value 'orange' not found for 'favorite-fruit'") | 		t.Errorf("Property value 'orange' not found for 'favorite-fruit'") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| @ -286,20 +288,20 @@ func TestParseTwoPropertiesOneValueMultispaced(t *testing.T) { | |||||||
| 	</div>` | 	</div>` | ||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 	if len(item.properties) != 2 { | 	if len(item.Properties) != 2 { | ||||||
| 		t.Errorf("Expecting 2 properties but got %d", len(item.properties)) | 		t.Errorf("Expecting 2 properties but got %d", len(item.Properties)) | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 	if len(item.properties["favorite-color"]) != 1 { | 	if len(item.Properties["favorite-color"]) != 1 { | ||||||
| 		t.Errorf("Expecting 1 value but got %d", len(item.properties["favorite-color"])) | 		t.Errorf("Expecting 1 value but got %d", len(item.Properties["favorite-color"])) | ||||||
| 	} | 	} | ||||||
| 	if len(item.properties["favorite-fruit"]) != 1 { | 	if len(item.Properties["favorite-fruit"]) != 1 { | ||||||
| 		t.Errorf("Expecting 1 value but got %d", len(item.properties["favorite-fruit"])) | 		t.Errorf("Expecting 1 value but got %d", len(item.Properties["favorite-fruit"])) | ||||||
| 	} | 	} | ||||||
| 	if item.properties["favorite-color"][0].(string) != "orange" { | 	if item.Properties["favorite-color"][0].(string) != "orange" { | ||||||
| 		t.Errorf("Property value 'orange' not found for 'favorite-color'") | 		t.Errorf("Property value 'orange' not found for 'favorite-color'") | ||||||
| 	} | 	} | ||||||
| 	if item.properties["favorite-fruit"][0].(string) != "orange" { | 	if item.Properties["favorite-fruit"][0].(string) != "orange" { | ||||||
| 		t.Errorf("Property value 'orange' not found for 'favorite-fruit'") | 		t.Errorf("Property value 'orange' not found for 'favorite-fruit'") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| @ -311,12 +313,12 @@ func TestParseItemType(t *testing.T) { | |||||||
| 	</div>` | 	</div>` | ||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 	if len(item.types) != 1 { | 	if len(item.Types) != 1 { | ||||||
| 		t.Errorf("Expecting 1 type but got %d", len(item.types)) | 		t.Errorf("Expecting 1 type but got %d", len(item.Types)) | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 	if item.types[0] != "http://example.org/animals#cat" { | 	if item.Types[0] != "http://example.org/animals#cat" { | ||||||
| 		t.Errorf("Expecting type of 'http://example.org/animals#cat' but got %d", item.types[0]) | 		t.Errorf("Expecting type of 'http://example.org/animals#cat' but got %d", item.Types[0]) | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| @ -327,15 +329,15 @@ func TestParseMultipleItemTypes(t *testing.T) { | |||||||
| 	</div>` | 	</div>` | ||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 	if len(item.types) != 2 { | 	if len(item.Types) != 2 { | ||||||
| 		t.Errorf("Expecting 2 types but got %d", len(item.types)) | 		t.Errorf("Expecting 2 types but got %d", len(item.Types)) | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 	if item.types[0] != "http://example.org/animals#mammal" { | 	if item.Types[0] != "http://example.org/animals#mammal" { | ||||||
| 		t.Errorf("Expecting type of 'http://example.org/animals#mammal' but got %d", item.types[0]) | 		t.Errorf("Expecting type of 'http://example.org/animals#mammal' but got %d", item.Types[0]) | ||||||
| 	} | 	} | ||||||
| 	if item.types[1] != "http://example.org/animals#cat" { | 	if item.Types[1] != "http://example.org/animals#cat" { | ||||||
| 		t.Errorf("Expecting type of 'http://example.org/animals#cat' but got %d", item.types[1]) | 		t.Errorf("Expecting type of 'http://example.org/animals#cat' but got %d", item.Types[1]) | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| @ -353,8 +355,8 @@ func TestParseItemId(t *testing.T) { | |||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 
 | 
 | ||||||
| 	if item.id != "urn:isbn:0-330-34032-8" { | 	if item.ID != "urn:isbn:0-330-34032-8" { | ||||||
| 		t.Errorf("Expecting id of 'urn:isbn:0-330-34032-8' but got %d", item.id) | 		t.Errorf("Expecting id of 'urn:isbn:0-330-34032-8' but got %d", item.ID) | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| @ -369,11 +371,11 @@ func TestParseItemRef(t *testing.T) { | |||||||
| 
 | 
 | ||||||
| 	item := ParseOneItem(html, t) | 	item := ParseOneItem(html, t) | ||||||
| 
 | 
 | ||||||
| 	if len(item.properties) != 3 { | 	if len(item.Properties) != 3 { | ||||||
| 		t.Errorf("Expecting 3 properties but got %d", len(item.properties)) | 		t.Errorf("Expecting 3 properties but got %d", len(item.Properties)) | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 	if item.properties["license"][0].(string) != "http://www.opensource.org/licenses/mit-license.php" { | 	if item.Properties["license"][0].(string) != "http://www.opensource.org/licenses/mit-license.php" { | ||||||
| 		t.Errorf("Property value 'http://www.opensource.org/licenses/mit-license.php' not found for 'license'") | 		t.Errorf("Property value 'http://www.opensource.org/licenses/mit-license.php' not found for 'license'") | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| @ -405,21 +407,21 @@ func TestParseSharedItemRef(t *testing.T) { | |||||||
| 
 | 
 | ||||||
| 	data := ParseData(html, t) | 	data := ParseData(html, t) | ||||||
| 
 | 
 | ||||||
| 	if len(data.items) != 2 { | 	if len(data.Items) != 2 { | ||||||
| 		t.Errorf("Expecting 2 items but got %d", len(data.items)) | 		t.Errorf("Expecting 2 items but got %d", len(data.Items)) | ||||||
| 	} | 	} | ||||||
| 	if len(data.items[0].properties) != 3 { | 	if len(data.Items[0].Properties) != 3 { | ||||||
| 		t.Errorf("Expecting 3 properties but got %d", len(data.items[0].properties)) | 		t.Errorf("Expecting 3 properties but got %d", len(data.Items[0].Properties)) | ||||||
| 	} | 	} | ||||||
| 	if len(data.items[1].properties) != 3 { | 	if len(data.Items[1].Properties) != 3 { | ||||||
| 		t.Errorf("Expecting 3 properties but got %d", len(data.items[1].properties)) | 		t.Errorf("Expecting 3 properties but got %d", len(data.Items[1].Properties)) | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 	if data.items[0].properties["license"][0].(string) != "http://www.opensource.org/licenses/mit-license.php" { | 	if data.Items[0].Properties["license"][0].(string) != "http://www.opensource.org/licenses/mit-license.php" { | ||||||
| 		t.Errorf("Property value 'http://www.opensource.org/licenses/mit-license.php' not found for 'license'") | 		t.Errorf("Property value 'http://www.opensource.org/licenses/mit-license.php' not found for 'license'") | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 	if data.items[1].properties["license"][0].(string) != "http://www.opensource.org/licenses/mit-license.php" { | 	if data.Items[1].Properties["license"][0].(string) != "http://www.opensource.org/licenses/mit-license.php" { | ||||||
| 		t.Errorf("Property value 'http://www.opensource.org/licenses/mit-license.php' not found for 'license'") | 		t.Errorf("Property value 'http://www.opensource.org/licenses/mit-license.php' not found for 'license'") | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| @ -438,11 +440,11 @@ func TestParseMultiValuedItemRef(t *testing.T) { | |||||||
| 
 | 
 | ||||||
| 	data := ParseData(html, t) | 	data := ParseData(html, t) | ||||||
| 
 | 
 | ||||||
| 	if data.items[0].properties["name"][0].(string) != "Amanda" { | 	if data.Items[0].Properties["name"][0].(string) != "Amanda" { | ||||||
| 		t.Errorf("Property value 'Amanda' not found for 'name'") | 		t.Errorf("Property value 'Amanda' not found for 'name'") | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 	if data.items[0].properties["age"][0].(string) != "26" { | 	if data.Items[0].Properties["age"][0].(string) != "26" { | ||||||
| 		t.Errorf("Property value '26' not found for 'age'") | 		t.Errorf("Property value '26' not found for 'age'") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| @ -456,18 +458,18 @@ func TestParseEmbeddedItem(t *testing.T) { | |||||||
| 
 | 
 | ||||||
| 	data := ParseData(html, t) | 	data := ParseData(html, t) | ||||||
| 
 | 
 | ||||||
| 	if len(data.items) != 1 { | 	if len(data.Items) != 1 { | ||||||
| 		t.Errorf("Expecting 1 item but got %d", len(data.items)) | 		t.Errorf("Expecting 1 item but got %d", len(data.Items)) | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 
 | 
 | ||||||
| 	if data.items[0].properties["name"][0].(string) != "Amanda" { | 	if data.Items[0].Properties["name"][0].(string) != "Amanda" { | ||||||
| 		t.Errorf("Property value 'Amanda' not found for 'name'") | 		t.Errorf("Property value 'Amanda' not found for 'name'") | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 	subitem := data.items[0].properties["band"][0].(*Item) | 	subitem := data.Items[0].Properties["band"][0].(*Item) | ||||||
| 
 | 
 | ||||||
| 	if subitem.properties["name"][0].(string) != "Jazz Band" { | 	if subitem.Properties["name"][0].(string) != "Jazz Band" { | ||||||
| 		t.Errorf("Property value 'Jazz Band' not found for 'name'") | 		t.Errorf("Property value 'Jazz Band' not found for 'name'") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| @ -484,19 +486,52 @@ func TestParseEmbeddedItemWithItemRef(t *testing.T) { | |||||||
| 
 | 
 | ||||||
| 	data := ParseData(html, t) | 	data := ParseData(html, t) | ||||||
| 
 | 
 | ||||||
| 	if len(data.items) != 1 { | 	if len(data.Items) != 1 { | ||||||
| 		t.Errorf("Expecting 1 item but got %d", len(data.items)) | 		t.Errorf("Expecting 1 item but got %d", len(data.Items)) | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 
 | 
 | ||||||
| 	if data.items[0].properties["name"][0].(string) != "Amanda" { | 	if data.Items[0].Properties["name"][0].(string) != "Amanda" { | ||||||
| 		t.Errorf("Property value 'Amanda' not found for 'name'") | 		t.Errorf("Property value 'Amanda' not found for 'name'") | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
| 	subitem := data.items[0].properties["band"][0].(*Item) | 	subitem := data.Items[0].Properties["band"][0].(*Item) | ||||||
| 
 | 
 | ||||||
| 	if subitem.properties["name"][0].(string) != "Jazz Band" { | 	if subitem.Properties["name"][0].(string) != "Jazz Band" { | ||||||
| 		t.Errorf("Property value 'Jazz Band' not found for 'name'") | 		t.Errorf("Property value 'Jazz Band' not found for 'name'") | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | 
 | ||||||
|  | 
 | ||||||
|  | func TestParseRelativeURL(t *testing.T) { | ||||||
|  | 	html := ` | ||||||
|  | 	<div itemscope> | ||||||
|  | 	 <a itemprop="image" href="test.png">foo</a> | ||||||
|  | 	</div>` | ||||||
|  | 
 | ||||||
|  | 	item := ParseOneItem(html, t) | ||||||
|  | 
 | ||||||
|  | 	if item.Properties["image"][0].(string) != "http://example.com/test.png" { | ||||||
|  | 		t.Errorf("Property value not found") | ||||||
|  | 	} | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | func TestParseItemRelativeId(t *testing.T) { | ||||||
|  | 	html := `<dl itemscope | ||||||
|  | 	    itemtype="http://vocab.example.net/book" | ||||||
|  | 	    itemid="foo"> | ||||||
|  | 	 <dt>Title | ||||||
|  | 	 <dd itemprop="title">The Reality Dysfunction | ||||||
|  | 	 <dt>Author | ||||||
|  | 	 <dd itemprop="author">Peter F. Hamilton | ||||||
|  | 	 <dt>Publication date | ||||||
|  | 	 <dd><time itemprop="pubdate" datetime="1996-01-26">26 January 1996</time> | ||||||
|  | 	</dl>` | ||||||
|  | 
 | ||||||
|  | 	item := ParseOneItem(html, t) | ||||||
|  | 
 | ||||||
|  | 	if item.ID != "http://example.com/foo" { | ||||||
|  | 		t.Errorf("Expecting id of 'http://example.com/foo' but got %d", item.ID) | ||||||
|  | 	} | ||||||
|  | } | ||||||
|  | |||||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user