| Total Complexity | 45 | 
| Total Lines | 174 | 
| Duplicated Lines | 0 % | 
Complex classes like pyspider.libs.Response often do a lot of different things. To break such a class down, we need to identify a cohesive component within that class. A common approach to find such a component is to look for fields/methods that share the same prefixes, or suffixes.
Once you have determined the fields that belong together, you can apply the Extract Class refactoring. If the component makes sense as a sub-class, Extract Subclass is also a candidate, and is often faster.
| 1 | #!/usr/bin/env python  | 
            ||
| 24 | class Response(object):  | 
            ||
| 25 | |||
| 26 | def __init__(self):  | 
            ||
| 27 | self.status_code = None  | 
            ||
| 28 | self.url = None  | 
            ||
| 29 | self.orig_url = None  | 
            ||
| 30 | self.headers = CaseInsensitiveDict()  | 
            ||
| 31 | self.content = ''  | 
            ||
| 32 |         self.cookies = {} | 
            ||
| 33 | self.error = None  | 
            ||
| 34 | self.save = None  | 
            ||
| 35 | self.js_script_result = None  | 
            ||
| 36 | self.time = 0  | 
            ||
| 37 | |||
| 38 | def __repr__(self):  | 
            ||
| 39 | return u'<Response [%d]>' % self.status_code  | 
            ||
| 40 | |||
| 41 | def __bool__(self):  | 
            ||
| 42 | """Returns true if `status_code` is 200 and no error"""  | 
            ||
| 43 | return self.ok  | 
            ||
| 44 | |||
| 45 | def __nonzero__(self):  | 
            ||
| 46 | """Returns true if `status_code` is 200 and no error."""  | 
            ||
| 47 | return self.ok  | 
            ||
| 48 | |||
| 49 | @property  | 
            ||
| 50 | def ok(self):  | 
            ||
| 51 | """Return true if `status_code` is 200 and no error."""  | 
            ||
| 52 | try:  | 
            ||
| 53 | self.raise_for_status()  | 
            ||
| 54 | except:  | 
            ||
| 55 | return False  | 
            ||
| 56 | return True  | 
            ||
| 57 | |||
| 58 | @property  | 
            ||
| 59 | def encoding(self):  | 
            ||
| 60 | """  | 
            ||
| 61 | encoding of Response.content.  | 
            ||
| 62 | |||
| 63 | if Response.encoding is None, encoding will be guessed  | 
            ||
| 64 | by header or content or chardet if available.  | 
            ||
| 65 | """  | 
            ||
| 66 | if hasattr(self, '_encoding'):  | 
            ||
| 67 | return self._encoding  | 
            ||
| 68 | |||
| 69 | # content is unicode  | 
            ||
| 70 | if isinstance(self.content, six.text_type):  | 
            ||
| 71 | return 'unicode'  | 
            ||
| 72 | |||
| 73 | # Try charset from content-type  | 
            ||
| 74 | encoding = get_encoding_from_headers(self.headers)  | 
            ||
| 75 | if encoding == 'ISO-8859-1':  | 
            ||
| 76 | encoding = None  | 
            ||
| 77 | |||
| 78 | # Try charset from content  | 
            ||
| 79 | if not encoding and get_encodings_from_content:  | 
            ||
| 80 | if six.PY3:  | 
            ||
| 81 | encoding = get_encodings_from_content(utils.pretty_unicode(self.content[:100]))  | 
            ||
| 82 | else:  | 
            ||
| 83 | encoding = get_encodings_from_content(self.content)  | 
            ||
| 84 | encoding = encoding and encoding[0] or None  | 
            ||
| 85 | |||
| 86 | # Fallback to auto-detected encoding.  | 
            ||
| 87 | if not encoding and chardet is not None:  | 
            ||
| 88 | encoding = chardet.detect(self.content)['encoding']  | 
            ||
| 89 | |||
| 90 | if encoding and encoding.lower() == 'gb2312':  | 
            ||
| 91 | encoding = 'gb18030'  | 
            ||
| 92 | |||
| 93 | self._encoding = encoding or 'utf-8'  | 
            ||
| 94 | return self._encoding  | 
            ||
| 95 | |||
| 96 | @encoding.setter  | 
            ||
| 97 | def encoding(self, value):  | 
            ||
| 98 | """  | 
            ||
| 99 | set encoding of content manually  | 
            ||
| 100 | it will overwrite the guessed encoding  | 
            ||
| 101 | """  | 
            ||
| 102 | self._encoding = value  | 
            ||
| 103 | self._text = None  | 
            ||
| 104 | |||
| 105 | @property  | 
            ||
| 106 | def text(self):  | 
            ||
| 107 | """  | 
            ||
| 108 | Content of the response, in unicode.  | 
            ||
| 109 | |||
| 110 | if Response.encoding is None and chardet module is available, encoding  | 
            ||
| 111 | will be guessed.  | 
            ||
| 112 | """  | 
            ||
| 113 | if hasattr(self, '_text') and self._text:  | 
            ||
| 114 | return self._text  | 
            ||
| 115 | if not self.content:  | 
            ||
| 116 | return u''  | 
            ||
| 117 | if isinstance(self.content, six.text_type):  | 
            ||
| 118 | return self.content  | 
            ||
| 119 | |||
| 120 | content = None  | 
            ||
| 121 | encoding = self.encoding  | 
            ||
| 122 | |||
| 123 | # Decode unicode from given encoding.  | 
            ||
| 124 | try:  | 
            ||
| 125 | content = self.content.decode(encoding, 'replace')  | 
            ||
| 126 | except LookupError:  | 
            ||
| 127 | # A LookupError is raised if the encoding was not found which could  | 
            ||
| 128 | # indicate a misspelling or similar mistake.  | 
            ||
| 129 | #  | 
            ||
| 130 | # So we try blindly encoding.  | 
            ||
| 131 |             content = self.content.decode('utf-8', 'replace') | 
            ||
| 132 | |||
| 133 | self._text = content  | 
            ||
| 134 | return content  | 
            ||
| 135 | |||
| 136 | @property  | 
            ||
| 137 | def json(self):  | 
            ||
| 138 | """Returns the json-encoded content of the response, if any."""  | 
            ||
| 139 | if hasattr(self, '_json'):  | 
            ||
| 140 | return self._json  | 
            ||
| 141 | try:  | 
            ||
| 142 | self._json = json.loads(self.text or self.content)  | 
            ||
| 143 | except ValueError:  | 
            ||
| 144 | self._json = None  | 
            ||
| 145 | return self._json  | 
            ||
| 146 | |||
| 147 | @property  | 
            ||
| 148 | def doc(self):  | 
            ||
| 149 | """Returns a PyQuery object of the response's content"""  | 
            ||
| 150 | if hasattr(self, '_doc'):  | 
            ||
| 151 | return self._doc  | 
            ||
| 152 | elements = self.etree  | 
            ||
| 153 | doc = self._doc = PyQuery(elements)  | 
            ||
| 154 | doc.make_links_absolute(self.url)  | 
            ||
| 155 | return doc  | 
            ||
| 156 | |||
| 157 | @property  | 
            ||
| 158 | def etree(self):  | 
            ||
| 159 | """Returns a lxml object of the response's content that can be selected by xpath"""  | 
            ||
| 160 | if not hasattr(self, '_elements'):  | 
            ||
| 161 | try:  | 
            ||
| 162 | parser = lxml.html.HTMLParser(encoding=self.encoding)  | 
            ||
| 163 | self._elements = lxml.html.fromstring(self.content, parser=parser)  | 
            ||
| 164 | except LookupError:  | 
            ||
| 165 | # lxml would raise LookupError when encoding not supported  | 
            ||
| 166 | # try fromstring without encoding instead.  | 
            ||
| 167 | # on windows, unicode is not availabe as encoding for lxml  | 
            ||
| 168 | self._elements = lxml.html.fromstring(self.content)  | 
            ||
| 169 | if isinstance(self._elements, lxml.etree._ElementTree):  | 
            ||
| 170 | self._elements = self._elements.getroot()  | 
            ||
| 171 | return self._elements  | 
            ||
| 172 | |||
| 173 | def raise_for_status(self, allow_redirects=True):  | 
            ||
| 174 | """Raises stored :class:`HTTPError` or :class:`URLError`, if one occurred."""  | 
            ||
| 175 | |||
| 176 | if self.status_code == 304:  | 
            ||
| 177 | return  | 
            ||
| 178 | elif self.error:  | 
            ||
| 179 | http_error = HTTPError(self.error)  | 
            ||
| 180 | elif (self.status_code >= 300) and (self.status_code < 400) and not allow_redirects:  | 
            ||
| 181 |             http_error = HTTPError('%s Redirection' % (self.status_code)) | 
            ||
| 182 | elif (self.status_code >= 400) and (self.status_code < 500):  | 
            ||
| 183 |             http_error = HTTPError('%s Client Error' % (self.status_code)) | 
            ||
| 184 | elif (self.status_code >= 500) and (self.status_code < 600):  | 
            ||
| 185 |             http_error = HTTPError('%s Server Error' % (self.status_code)) | 
            ||
| 186 | else:  | 
            ||
| 187 | return  | 
            ||
| 188 | |||
| 189 | http_error.response = self  | 
            ||
| 190 | raise http_error  | 
            ||
| 191 | |||
| 192 | def isok(self):  | 
            ||
| 193 | try:  | 
            ||
| 194 | self.raise_for_status()  | 
            ||
| 195 | return True  | 
            ||
| 196 | except:  | 
            ||
| 197 | return False  | 
            ||
| 198 | |||
| 213 |