diff --git a/tests/test_cluster.py b/tests/test_cluster.py
deleted file mode 100644
index 9225e56..0000000
--- a/tests/test_cluster.py
+++ /dev/null
@@ -1,192 +0,0 @@
-# coding=utf-8
-
-import asyncio
-import logging
-from urllib.parse import urljoin
-
-from xpaw.spider import Spider
-from xpaw.http import HttpRequest
-from xpaw.selector import Selector
-from xpaw.run import run_spider
-from xpaw.handler import every
-from xpaw.item import Item, Field
-from xpaw.errors import IgnoreItem
-from xpaw.queue import PriorityQueue
-
-
-class FooSpider(Spider):
-    def start_requests(self):
-        yield HttpRequest('http://localhost:80')
-        yield HttpRequest('http://httpbin.org/get')
-
-    async def parse(self, response):
-        await asyncio.sleep(1, loop=self.cluster.loop)
-        return ()
-
-
-class BadQueue(PriorityQueue):
-    async def pop(self):
-        req = await super().pop()
-        if req.url == 'http://localhost:80':
-            raise RuntimeError('not an error actually')
-        return req
-
-
-def test_coro_terminated():
-    run_spider(FooSpider, downloader_clients=2, queue_cls=BadQueue, max_retry_times=0)
-    logging.getLogger('xpaw').handlers.clear()
-
-
-class LinkItem(Item):
-    url = Field()
-
-
-class LinkPipeline:
-    def __init__(self, n, tot, data, cluster):
-        self.n = n
-        self.tot = tot
-        self.data = data
-        self.cluster = cluster
-
-    @classmethod
-    def from_cluster(cls, cluster):
-        n = cluster.config.getint('link_count')
-        data = cluster.config.get('link_data')
-        tot = cluster.config.getint('link_total')
-        return cls(n, tot, data, cluster)
-
-    async def handle_item(self, item):
-        url = item['url']
-        if url == "http://httpbin.org/links/{}".format(self.n):
-            raise IgnoreItem
-        self.data.add(url)
-
-
-class MyError(Exception):
-    pass
-
-
-class LinkDownloaderMiddleware:
-    def handle_request(self, request):
-        if request.url == 'http://httpbin.org/status/406':
-            return HttpRequest('http://httpbin.org/status/407')
-        if request.url == 'http://httpbin.org/status/410':
-            raise MyError
-
-    def handle_response(self, request, response):
-        if request.url == 'http://httpbin.org/status/407':
-            return HttpRequest('http://httpbin.org/status/409')
-
-    def handle_error(self, request, error):
-        if isinstance(error, MyError):
-            return HttpRequest('http://httpbin.org/status/411')
-
-
-class LinkSpiderMiddleware:
-    def handle_input(self, response):
-        if response.request.url == 'http://httpbin.org/status/412':
-            raise MyError
-
-    def handle_output(self, response, result):
-        return result
-
-    def handle_error(self, response, error):
-        if isinstance(error, MyError):
-            return ()
-
-
-class LinkSpider(Spider):
-    def __init__(self, *args, **kwargs):
-        super().__init__(*args, **kwargs)
-        self.link_count = self.config.get('link_count')
-        self.data = self.config.get('link_data')
-        self.tot = self.config.get('link_total')
-
-    def open(self):
-        asyncio.ensure_future(self.supervisor(), loop=self.cluster.loop)
-
-    async def supervisor(self):
-        while True:
-            if len(self.data) >= self.tot:
-                asyncio.ensure_future(self.cluster.shutdown(), loop=self.cluster.loop)
-                break
-            await asyncio.sleep(1, loop=self.cluster.loop)
-
-    @every(seconds=30)
-    def start_requests(self):
-        yield HttpRequest("http://localhost:80", errback=self.error_back)
-        yield HttpRequest("http://localhost:81", errback=self.async_error_back)
-        yield HttpRequest("http://httpbin.org/status/401", callback=self.generator_parse)
-        yield HttpRequest("http://httpbin.org/status/402", callback=self.func_prase)
-        yield HttpRequest("http://httpbin.org/status/403", callback=self.async_parse)
-        yield HttpRequest("http://httpbin.org/status/404", callback=self.return_list_parse)
-        yield HttpRequest("http://httpbin.org/status/405", callback=self.return_none)
-        yield HttpRequest("http://httpbin.org/status/406")
-        yield HttpRequest("http://httpbin.org/status/408")
-        yield HttpRequest("http://httpbin.org/status/410")
-        yield HttpRequest("http://httpbin.org/status/412", errback=self.handle_input_error)
-        yield HttpRequest("http://httpbin.org/links/{}".format(self.link_count))
-
-    def parse(self, response):
-        selector = Selector(response.text)
-        for href in selector.xpath('//a/@href').text:
-            yield HttpRequest(urljoin(str(response.url), href))
-        yield LinkItem(url=response.request.url)
-
-    def error_back(self, request, err):
-        self.data.add(request.url)
-        raise RuntimeError('not an error actually')
-
-    async def async_error_back(self, request, err):
-        self.data.add(request.url)
-        raise RuntimeError('not an error actually')
-
-    def generator_parse(self, response):
-        self.data.add(response.request.url)
-        if response.status / 100 != 2:
-            raise RuntimeError('not an error actually')
-        # it will never come here
-        yield None
-
-    def func_prase(self, response):
-        self.data.add(response.request.url)
-        raise RuntimeError('not an error actually')
-
-    async def async_parse(self, response):
-        self.data.add(response.request.url)
-        raise RuntimeError('not an error actually')
-
-    def return_list_parse(self, response):
-        self.data.add(response.request.url)
-        return []
-
-    def return_none(self, response):
-        self.data.add(response.request.url)
-
-    def handle_input_error(self, request, error):
-        assert isinstance(error, MyError)
-        self.data.add(request.url)
-
-
-def test_run_link_spider():
-    link_data = set()
-    link_count = 5
-    link_total = 15
-    run_spider(LinkSpider, downloader_timeout=60, log_level='DEBUG', item_pipelines=[LinkPipeline],
-               link_data=link_data, link_count=link_count, link_total=link_total, max_retry_times=1,
-               downloader_clients=10, spider_middlewares=[LinkSpiderMiddleware],
-               downloader_middlewares=[LinkDownloaderMiddleware])
-    assert len(link_data) == link_total
-    for i in range(link_count):
-        assert "http://httpbin.org/links/{}/{}".format(link_count, i) in link_data
-    assert "http://localhost:80" in link_data
-    assert "http://localhost:81" in link_data
-    assert "http://httpbin.org/status/401" in link_data
-    assert "http://httpbin.org/status/402" in link_data
-    assert "http://httpbin.org/status/403" in link_data
-    assert "http://httpbin.org/status/404" in link_data
-    assert "http://httpbin.org/status/405" in link_data
-    assert "http://httpbin.org/status/409" in link_data
-    assert "http://httpbin.org/status/411" in link_data
-    assert "http://httpbin.org/status/412" in link_data
-    logging.getLogger('xpaw').handlers.clear()
diff --git a/tests/test_run.py b/tests/test_run.py
index b67f389..7bf13cc 100644
--- a/tests/test_run.py
+++ b/tests/test_run.py
@@ -1,12 +1,21 @@
 # coding=utf-8
 
 from os.path import join
+import asyncio
 import logging
+from urllib.parse import urljoin
 
 import pytest
 
 from xpaw.cli import main
 from xpaw.run import run_crawler
+from xpaw.spider import Spider
+from xpaw.http import HttpRequest
+from xpaw.selector import Selector
+from xpaw.run import run_spider
+from xpaw.item import Item, Field
+from xpaw.errors import IgnoreItem
+from xpaw.queue import PriorityQueue
 
 
 def test_run_crawler(tmpdir, capsys):
@@ -18,3 +27,167 @@ def test_run_crawler(tmpdir, capsys):
     run_crawler(proj_dir, downloader_timeout=0.01, log_level='WARNING')
     _, _ = capsys.readouterr()
     logging.getLogger('xpaw').handlers.clear()
+
+
+class FooSpider(Spider):
+    def start_requests(self):
+        yield HttpRequest('http://localhost:80')
+        yield HttpRequest('http://httpbin.org/get')
+
+    async def parse(self, response):
+        await asyncio.sleep(1, loop=self.cluster.loop)
+        return ()
+
+
+class BadQueue(PriorityQueue):
+    async def pop(self):
+        req = await super().pop()
+        if req.url == 'http://localhost:80':
+            raise RuntimeError('not an error actually')
+        return req
+
+
+def test_coro_terminated():
+    run_spider(FooSpider, downloader_clients=2, queue_cls=BadQueue, max_retry_times=0)
+    logging.getLogger('xpaw').handlers.clear()
+
+
+class LinkItem(Item):
+    url = Field()
+
+
+class LinkPipeline:
+    def __init__(self, n, data, cluster):
+        self.n = n
+        self.data = data
+        self.cluster = cluster
+
+    @classmethod
+    def from_cluster(cls, cluster):
+        n = cluster.config.getint('link_count')
+        data = cluster.config.get('link_data')
+        return cls(n, data, cluster)
+
+    async def handle_item(self, item):
+        url = item['url']
+        if url == "http://httpbin.org/links/{}".format(self.n):
+            raise IgnoreItem
+        self.data.add(url)
+
+
+class MyError(Exception):
+    pass
+
+
+class LinkDownloaderMiddleware:
+    def handle_request(self, request):
+        if request.url == 'http://httpbin.org/status/406':
+            return HttpRequest('http://httpbin.org/status/407')
+        if request.url == 'http://httpbin.org/status/410':
+            raise MyError
+
+    def handle_response(self, request, response):
+        if request.url == 'http://httpbin.org/status/407':
+            return HttpRequest('http://httpbin.org/status/409')
+
+    def handle_error(self, request, error):
+        if isinstance(error, MyError):
+            return HttpRequest('http://httpbin.org/status/411')
+
+
+class LinkSpiderMiddleware:
+    def handle_input(self, response):
+        if response.request.url == 'http://httpbin.org/status/412':
+            raise MyError
+
+    def handle_output(self, response, result):
+        return result
+
+    def handle_error(self, response, error):
+        if isinstance(error, MyError):
+            return ()
+
+
+class LinkSpider(Spider):
+    def __init__(self, *args, **kwargs):
+        super().__init__(*args, **kwargs)
+        self.link_count = self.config.get('link_count')
+        self.data = self.config.get('link_data')
+
+    def start_requests(self):
+        yield HttpRequest("http://localhost:80", errback=self.error_back)
+        yield HttpRequest("http://localhost:81", errback=self.async_error_back)
+        yield HttpRequest("http://httpbin.org/status/401", callback=self.generator_parse)
+        yield HttpRequest("http://httpbin.org/status/402", callback=self.func_prase)
+        yield HttpRequest("http://httpbin.org/status/403", callback=self.async_parse)
+        yield HttpRequest("http://httpbin.org/status/404", callback=self.return_list_parse)
+        yield HttpRequest("http://httpbin.org/status/405", callback=self.return_none)
+        yield HttpRequest("http://httpbin.org/status/406")
+        yield HttpRequest("http://httpbin.org/status/408")
+        yield HttpRequest("http://httpbin.org/status/410")
+        yield HttpRequest("http://httpbin.org/status/412", errback=self.handle_input_error)
+        yield HttpRequest("http://httpbin.org/links/{}".format(self.link_count))
+
+    def parse(self, response):
+        selector = Selector(response.text)
+        for href in selector.xpath('//a/@href').text:
+            yield HttpRequest(urljoin(str(response.url), href))
+        yield LinkItem(url=response.request.url)
+
+    def error_back(self, request, err):
+        self.data.add(request.url)
+        raise RuntimeError('not an error actually')
+
+    async def async_error_back(self, request, err):
+        self.data.add(request.url)
+        raise RuntimeError('not an error actually')
+
+    def generator_parse(self, response):
+        self.data.add(response.request.url)
+        if response.status / 100 != 2:
+            raise RuntimeError('not an error actually')
+        # it will never come here
+        yield None
+
+    def func_prase(self, response):
+        self.data.add(response.request.url)
+        raise RuntimeError('not an error actually')
+
+    async def async_parse(self, response):
+        self.data.add(response.request.url)
+        raise RuntimeError('not an error actually')
+
+    def return_list_parse(self, response):
+        self.data.add(response.request.url)
+        return []
+
+    def return_none(self, response):
+        self.data.add(response.request.url)
+
+    def handle_input_error(self, request, error):
+        assert isinstance(error, MyError)
+        self.data.add(request.url)
+
+
+def test_run_spider():
+    link_data = set()
+    link_count = 5
+    link_total = 15
+    run_spider(LinkSpider, downloader_timeout=60, log_level='DEBUG', item_pipelines=[LinkPipeline],
+               link_data=link_data, link_count=link_count, max_retry_times=1,
+               downloader_clients=10, spider_middlewares=[LinkSpiderMiddleware],
+               downloader_middlewares=[LinkDownloaderMiddleware])
+    assert len(link_data) == link_total
+    for i in range(link_count):
+        assert "http://httpbin.org/links/{}/{}".format(link_count, i) in link_data
+    assert "http://localhost:80" in link_data
+    assert "http://localhost:81" in link_data
+    assert "http://httpbin.org/status/401" in link_data
+    assert "http://httpbin.org/status/402" in link_data
+    assert "http://httpbin.org/status/403" in link_data
+    assert "http://httpbin.org/status/404" in link_data
+    assert "http://httpbin.org/status/405" in link_data
+    assert "http://httpbin.org/status/409" in link_data
+    assert "http://httpbin.org/status/411" in link_data
+    assert "http://httpbin.org/status/412" in link_data
+    logging.getLogger('xpaw').handlers.clear()
diff --git a/tests/test_selector.py b/tests/test_selector.py
index 72aebe1..d878202 100644
--- a/tests/test_selector.py
+++ b/tests/test_selector.py
@@ -6,7 +6,7 @@
 from xpaw.selector import Selector
 
 
-class TestSelector:
+class TestXPathSelector:
     def test_selector_list(self):
         html = """<ul><li>a</li><li></li></ul>"""
         s = Selector(html)
@@ -22,21 +22,24 @@ def test_attribute_selection(self):
         assert s.xpath("//a/@href")[0].text == "http://example.com/"
         assert s.xpath("//a/@target")[0].text == "_blank"
 
-    def test_text(self):
+    def test_text_selection(self):
         html = """<p>expression: <var>x</var>+<var>y</var>=<var>z</var></p>"""
         s = Selector(html)
         assert s.xpath("//var/text()")[0].text == "x"
         assert s.xpath("//var")[0].text == "x"
+        assert s.xpath("//var[last()]").text == ["z"]
         assert s.xpath("//var/text()").text == ["x", "y", "z"]
         assert s.xpath("//var").text == ["x", "y", "z"]
-        assert s.xpath("//p")[0].string == "<p>expression: <var>x</var>+<var>y</var>=<var>z</var></p>"
         assert s.xpath("//p")[0].text == "expression: x+y=z"
         assert s.xpath("//p/text()")[0].string == "expression: "
 
-        xs = Selector(html, doctype='xml')
-        assert xs.xpath("//p")[0].string == "<p>expression: <var>x</var>+<var>y</var>=<var>z</var></p>"
-        assert xs.xpath("//p")[0].text == "expression: x+y=z"
-        assert xs.xpath("//p/text()")[0].string == "expression: "
+    def test_diff_between_string_and_text(self):
+        html = """<p>expression: <var>x</var>+<var>y</var>=<var>z</var></p>"""
+        s = Selector(html)
+        assert s.xpath("//var")[0].text == "x"
+        assert s.xpath("//var")[0].string == "<var>x</var>"
+        assert s.xpath("//var").text == ["x", "y", "z"]
+        assert s.xpath("//var").string == ["<var>x</var>", "<var>y</var>", "<var>z</var>"]
 
     def test_node_selection(self):
         html = """<div><p>primary</p><p>minor</p></div>"""
@@ -140,3 +143,37 @@ def test_attribute_selection(self):
         assert s.css('ul').attr('class') == [None]
         assert s.css('ul')[0].attr('class') is None
         assert s.css('h2').attr('class') == []
+
+
+class TestDoctypeXml:
+    def test_text_selection(self):
+        xml = """<p>expression: <var>x</var>+<var>y</var>=<var>z</var></p>"""
+        xs = Selector(xml, doctype='xml')
+        assert xs.xpath("//var/text()")[0].text == "x"
+        assert xs.xpath("//var")[0].text == "x"
+        assert xs.xpath("//var/text()").text == ["x", "y", "z"]
+        assert xs.xpath("//var").text == ["x", "y", "z"]
+
+    def test_not_xml(self):
+        from lxml.etree import XMLSyntaxError
+        xml = """expression: x+y=z"""
+        with pytest.raises(XMLSyntaxError):
+            xs = Selector(xml, doctype='xml')
+
+
+def test_selection_error():
+    xml = """
+    <bookstore>
+        <book>
+            <title>Harry Potter</title>
+            <price>29.99</price>
+        </book>
+        <book>
+            <title>Learning XML</title>
+            <price>39.95</price>
+        </book>
+    </bookstore>"""
+
+    s = Selector(xml, doctype='xml')
+    assert s.xpath('/bookstore/book[first()]') == []
+    assert s.css('book >> price') == []