0
|
1 <?xml version="1.0" encoding="UTF-8"?>
|
|
2 <!--
|
|
3 Licensed to the Apache Software Foundation (ASF) under one or more
|
|
4 contributor license agreements. See the NOTICE file distributed with
|
|
5 this work for additional information regarding copyright ownership.
|
|
6 The ASF licenses this file to You under the Apache License, Version 2.0
|
|
7 (the "License"); you may not use this file except in compliance with
|
|
8 the License. You may obtain a copy of the License at
|
|
9
|
|
10 http://www.apache.org/licenses/LICENSE-2.0
|
|
11
|
|
12 Unless required by applicable law or agreed to in writing, software
|
|
13 distributed under the License is distributed on an "AS IS" BASIS,
|
|
14 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
15 See the License for the specific language governing permissions and
|
|
16 limitations under the License.
|
|
17 -->
|
|
18
|
|
19 <!--
|
|
20 Document : domain-suffixes.xsd
|
|
21 Author : Enis Soztutar - enis.soz.nutch@gmail.com
|
|
22 Description: This document is the schema for valid domain-suffixes
|
|
23 definitions. For successful parsing of domain-suffixes xml files,
|
|
24 the xml file should be validated with this xsd.
|
|
25 See : org.apache.nutch.util.domain.DomainSuffixesReader.java
|
|
26 -->
|
|
27
|
|
28 <xs:schema xmlns:xs="http://www.w3.org/2001/XMLSchema"
|
|
29 targetNamespace="http://lucene.apache.org/nutch"
|
|
30 xmlns="http://lucene.apache.org/nutch"
|
|
31 elementFormDefault="qualified">
|
|
32
|
|
33 <xs:element name="domains">
|
|
34 <xs:complexType>
|
|
35 <xs:sequence>
|
|
36 <xs:element name="tlds">
|
|
37 <xs:complexType>
|
|
38 <xs:sequence>
|
|
39 <xs:element name="itlds">
|
|
40 <xs:complexType>
|
|
41 <xs:sequence>
|
|
42 <xs:element name="tld" maxOccurs="unbounded"
|
|
43 type="gtld" />
|
|
44 </xs:sequence>
|
|
45 </xs:complexType>
|
|
46 </xs:element>
|
|
47
|
|
48 <xs:element name="gtlds">
|
|
49 <xs:complexType>
|
|
50 <xs:sequence>
|
|
51 <xs:element name="tld" maxOccurs="unbounded"
|
|
52 type="gtld" />
|
|
53 </xs:sequence>
|
|
54 </xs:complexType>
|
|
55 </xs:element>
|
|
56
|
|
57 <xs:element name="cctlds">
|
|
58 <xs:complexType>
|
|
59 <xs:sequence>
|
|
60 <xs:element name="tld" maxOccurs="unbounded"
|
|
61 type="cctld" />
|
|
62 </xs:sequence>
|
|
63 </xs:complexType>
|
|
64 </xs:element>
|
|
65
|
|
66 </xs:sequence>
|
|
67 </xs:complexType>
|
|
68 </xs:element>
|
|
69
|
|
70 <xs:element name="suffixes">
|
|
71 <xs:complexType>
|
|
72 <xs:sequence>
|
|
73 <xs:element name="suffix" maxOccurs="unbounded"
|
|
74 type="sldType" />
|
|
75 </xs:sequence>
|
|
76 </xs:complexType>
|
|
77 </xs:element>
|
|
78 </xs:sequence>
|
|
79 </xs:complexType>
|
|
80 </xs:element>
|
|
81
|
|
82 <xs:complexType name="gtld">
|
|
83 <xs:sequence>
|
|
84 <xs:element name="status" minOccurs="0">
|
|
85 <xs:simpleType>
|
|
86 <xs:restriction base="xs:string">
|
|
87 <xs:enumeration value="INFRASTRUCTURE" />
|
|
88 <xs:enumeration value="SPONSORED" />
|
|
89 <xs:enumeration value="UNSPONSORED" />
|
|
90 <xs:enumeration value="STARTUP" />
|
|
91 <xs:enumeration value="PROPOSED" />
|
|
92 <xs:enumeration value="DELETED" />
|
|
93 <xs:enumeration value="PSEUDO_DOMAIN" />
|
|
94 </xs:restriction>
|
|
95 </xs:simpleType>
|
|
96 </xs:element>
|
|
97 <xs:element name="boost" type="xs:float" minOccurs="0" />
|
|
98 <xs:element name="description" type="xs:string" minOccurs="0" />
|
|
99 </xs:sequence>
|
|
100 <xs:attribute name="domain" type="xs:string" />
|
|
101 </xs:complexType>
|
|
102
|
|
103 <xs:complexType name="cctld">
|
|
104 <xs:sequence>
|
|
105 <xs:element name="country" type="xs:string" />
|
|
106 <xs:element name="status" type="statusType" minOccurs="0" />
|
|
107 <xs:element name="boost" type="xs:float" minOccurs="0" />
|
|
108 <xs:element name="description" type="xs:string" minOccurs="0" />
|
|
109 </xs:sequence>
|
|
110 <xs:attribute name="domain" type="xs:string" />
|
|
111 </xs:complexType>
|
|
112
|
|
113 <xs:complexType name="sldType">
|
|
114 <xs:sequence>
|
|
115 <xs:element name="status" type="statusType" minOccurs="0" />
|
|
116 <xs:element name="boost" type="xs:float" minOccurs="0" />
|
|
117 <xs:element name="description" type="xs:string" minOccurs="0" />
|
|
118 </xs:sequence>
|
|
119 <xs:attribute name="domain" type="xs:string" />
|
|
120 </xs:complexType>
|
|
121
|
|
122 <xs:simpleType name="statusType">
|
|
123 <xs:restriction base="xs:string">
|
|
124 <xs:enumeration value="IN_USE" />
|
|
125 <xs:enumeration value="NOT_IN_USE" />
|
|
126 <xs:enumeration value="DELETED" />
|
|
127 </xs:restriction>
|
|
128 </xs:simpleType>
|
|
129
|
|
130 </xs:schema>
|