distrib.py 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386
  1. # -*- test-case-name: twisted.web.test.test_distrib -*-
  2. # Copyright (c) Twisted Matrix Laboratories.
  3. # See LICENSE for details.
  4. """
  5. Distributed web servers.
  6. This is going to have to be refactored so that argument parsing is done
  7. by each subprocess and not by the main web server (i.e. GET, POST etc.).
  8. """
  9. # System Imports
  10. import os, copy
  11. try:
  12. import pwd
  13. except ImportError:
  14. pwd = None
  15. from io import BytesIO
  16. from xml.dom.minidom import getDOMImplementation
  17. # Twisted Imports
  18. from twisted.spread import pb
  19. from twisted.spread.banana import SIZE_LIMIT
  20. from twisted.web import http, resource, server, util, static
  21. from twisted.web.http_headers import Headers
  22. from twisted.persisted import styles
  23. from twisted.internet import address, reactor
  24. from twisted.logger import Logger
  25. class _ReferenceableProducerWrapper(pb.Referenceable):
  26. def __init__(self, producer):
  27. self.producer = producer
  28. def remote_resumeProducing(self):
  29. self.producer.resumeProducing()
  30. def remote_pauseProducing(self):
  31. self.producer.pauseProducing()
  32. def remote_stopProducing(self):
  33. self.producer.stopProducing()
  34. class Request(pb.RemoteCopy, server.Request):
  35. """
  36. A request which was received by a L{ResourceSubscription} and sent via
  37. PB to a distributed node.
  38. """
  39. def setCopyableState(self, state):
  40. """
  41. Initialize this L{twisted.web.distrib.Request} based on the copied
  42. state so that it closely resembles a L{twisted.web.server.Request}.
  43. """
  44. for k in 'host', 'client':
  45. tup = state[k]
  46. addrdesc = {'INET': 'TCP', 'UNIX': 'UNIX'}[tup[0]]
  47. addr = {'TCP': lambda: address.IPv4Address(addrdesc,
  48. tup[1], tup[2]),
  49. 'UNIX': lambda: address.UNIXAddress(tup[1])}[addrdesc]()
  50. state[k] = addr
  51. state['requestHeaders'] = Headers(dict(state['requestHeaders']))
  52. pb.RemoteCopy.setCopyableState(self, state)
  53. # Emulate the local request interface --
  54. self.content = BytesIO(self.content_data)
  55. self.finish = self.remote.remoteMethod('finish')
  56. self.setHeader = self.remote.remoteMethod('setHeader')
  57. self.addCookie = self.remote.remoteMethod('addCookie')
  58. self.setETag = self.remote.remoteMethod('setETag')
  59. self.setResponseCode = self.remote.remoteMethod('setResponseCode')
  60. self.setLastModified = self.remote.remoteMethod('setLastModified')
  61. # To avoid failing if a resource tries to write a very long string
  62. # all at once, this one will be handled slightly differently.
  63. self._write = self.remote.remoteMethod('write')
  64. def write(self, bytes):
  65. """
  66. Write the given bytes to the response body.
  67. @param bytes: The bytes to write. If this is longer than 640k, it
  68. will be split up into smaller pieces.
  69. """
  70. start = 0
  71. end = SIZE_LIMIT
  72. while True:
  73. self._write(bytes[start:end])
  74. start += SIZE_LIMIT
  75. end += SIZE_LIMIT
  76. if start >= len(bytes):
  77. break
  78. def registerProducer(self, producer, streaming):
  79. self.remote.callRemote("registerProducer",
  80. _ReferenceableProducerWrapper(producer),
  81. streaming).addErrback(self.fail)
  82. def unregisterProducer(self):
  83. self.remote.callRemote("unregisterProducer").addErrback(self.fail)
  84. def fail(self, failure):
  85. self._log.failure('', failure=failure)
  86. pb.setUnjellyableForClass(server.Request, Request)
  87. class Issue:
  88. _log = Logger()
  89. def __init__(self, request):
  90. self.request = request
  91. def finished(self, result):
  92. if result is not server.NOT_DONE_YET:
  93. assert isinstance(result, str), "return value not a string"
  94. self.request.write(result)
  95. self.request.finish()
  96. def failed(self, failure):
  97. #XXX: Argh. FIXME.
  98. failure = str(failure)
  99. self.request.write(
  100. resource.ErrorPage(http.INTERNAL_SERVER_ERROR,
  101. "Server Connection Lost",
  102. "Connection to distributed server lost:" +
  103. util._PRE(failure)).
  104. render(self.request))
  105. self.request.finish()
  106. self._log.info(failure)
  107. class ResourceSubscription(resource.Resource):
  108. isLeaf = 1
  109. waiting = 0
  110. _log = Logger()
  111. def __init__(self, host, port):
  112. resource.Resource.__init__(self)
  113. self.host = host
  114. self.port = port
  115. self.pending = []
  116. self.publisher = None
  117. def __getstate__(self):
  118. """Get persistent state for this ResourceSubscription.
  119. """
  120. # When I unserialize,
  121. state = copy.copy(self.__dict__)
  122. # Publisher won't be connected...
  123. state['publisher'] = None
  124. # I won't be making a connection
  125. state['waiting'] = 0
  126. # There will be no pending requests.
  127. state['pending'] = []
  128. return state
  129. def connected(self, publisher):
  130. """I've connected to a publisher; I'll now send all my requests.
  131. """
  132. self._log.info('connected to publisher')
  133. publisher.broker.notifyOnDisconnect(self.booted)
  134. self.publisher = publisher
  135. self.waiting = 0
  136. for request in self.pending:
  137. self.render(request)
  138. self.pending = []
  139. def notConnected(self, msg):
  140. """I can't connect to a publisher; I'll now reply to all pending
  141. requests.
  142. """
  143. self._log.info(
  144. "could not connect to distributed web service: {msg}",
  145. msg=msg
  146. )
  147. self.waiting = 0
  148. self.publisher = None
  149. for request in self.pending:
  150. request.write("Unable to connect to distributed server.")
  151. request.finish()
  152. self.pending = []
  153. def booted(self):
  154. self.notConnected("connection dropped")
  155. def render(self, request):
  156. """Render this request, from my server.
  157. This will always be asynchronous, and therefore return NOT_DONE_YET.
  158. It spins off a request to the pb client, and either adds it to the list
  159. of pending issues or requests it immediately, depending on if the
  160. client is already connected.
  161. """
  162. if not self.publisher:
  163. self.pending.append(request)
  164. if not self.waiting:
  165. self.waiting = 1
  166. bf = pb.PBClientFactory()
  167. timeout = 10
  168. if self.host == "unix":
  169. reactor.connectUNIX(self.port, bf, timeout)
  170. else:
  171. reactor.connectTCP(self.host, self.port, bf, timeout)
  172. d = bf.getRootObject()
  173. d.addCallbacks(self.connected, self.notConnected)
  174. else:
  175. i = Issue(request)
  176. self.publisher.callRemote('request', request).addCallbacks(i.finished, i.failed)
  177. return server.NOT_DONE_YET
  178. class ResourcePublisher(pb.Root, styles.Versioned):
  179. """
  180. L{ResourcePublisher} exposes a remote API which can be used to respond
  181. to request.
  182. @ivar site: The site which will be used for resource lookup.
  183. @type site: L{twisted.web.server.Site}
  184. """
  185. _log = Logger()
  186. def __init__(self, site):
  187. self.site = site
  188. persistenceVersion = 2
  189. def upgradeToVersion2(self):
  190. self.application.authorizer.removeIdentity("web")
  191. del self.application.services[self.serviceName]
  192. del self.serviceName
  193. del self.application
  194. del self.perspectiveName
  195. def getPerspectiveNamed(self, name):
  196. return self
  197. def remote_request(self, request):
  198. """
  199. Look up the resource for the given request and render it.
  200. """
  201. res = self.site.getResourceFor(request)
  202. self._log.info(request)
  203. result = res.render(request)
  204. if result is not server.NOT_DONE_YET:
  205. request.write(result)
  206. request.finish()
  207. return server.NOT_DONE_YET
  208. class UserDirectory(resource.Resource):
  209. """
  210. A resource which lists available user resources and serves them as
  211. children.
  212. @ivar _pwd: An object like L{pwd} which is used to enumerate users and
  213. their home directories.
  214. """
  215. userDirName = 'public_html'
  216. userSocketName = '.twistd-web-pb'
  217. template = """
  218. <html>
  219. <head>
  220. <title>twisted.web.distrib.UserDirectory</title>
  221. <style>
  222. a
  223. {
  224. font-family: Lucida, Verdana, Helvetica, Arial, sans-serif;
  225. color: #369;
  226. text-decoration: none;
  227. }
  228. th
  229. {
  230. font-family: Lucida, Verdana, Helvetica, Arial, sans-serif;
  231. font-weight: bold;
  232. text-decoration: none;
  233. text-align: left;
  234. }
  235. pre, code
  236. {
  237. font-family: "Courier New", Courier, monospace;
  238. }
  239. p, body, td, ol, ul, menu, blockquote, div
  240. {
  241. font-family: Lucida, Verdana, Helvetica, Arial, sans-serif;
  242. color: #000;
  243. }
  244. </style>
  245. </head>
  246. <body>
  247. <h1>twisted.web.distrib.UserDirectory</h1>
  248. %(users)s
  249. </body>
  250. </html>
  251. """
  252. def __init__(self, userDatabase=None):
  253. resource.Resource.__init__(self)
  254. if userDatabase is None:
  255. userDatabase = pwd
  256. self._pwd = userDatabase
  257. def _users(self):
  258. """
  259. Return a list of two-tuples giving links to user resources and text to
  260. associate with those links.
  261. """
  262. users = []
  263. for user in self._pwd.getpwall():
  264. name, passwd, uid, gid, gecos, dir, shell = user
  265. realname = gecos.split(',')[0]
  266. if not realname:
  267. realname = name
  268. if os.path.exists(os.path.join(dir, self.userDirName)):
  269. users.append((name, realname + ' (file)'))
  270. twistdsock = os.path.join(dir, self.userSocketName)
  271. if os.path.exists(twistdsock):
  272. linkName = name + '.twistd'
  273. users.append((linkName, realname + ' (twistd)'))
  274. return users
  275. def render_GET(self, request):
  276. """
  277. Render as HTML a listing of all known users with links to their
  278. personal resources.
  279. """
  280. domImpl = getDOMImplementation()
  281. newDoc = domImpl.createDocument(None, "ul", None)
  282. listing = newDoc.documentElement
  283. for link, text in self._users():
  284. linkElement = newDoc.createElement('a')
  285. linkElement.setAttribute('href', link + '/')
  286. textNode = newDoc.createTextNode(text)
  287. linkElement.appendChild(textNode)
  288. item = newDoc.createElement('li')
  289. item.appendChild(linkElement)
  290. listing.appendChild(item)
  291. htmlDoc = self.template % ({'users': listing.toxml()})
  292. return htmlDoc.encode("utf-8")
  293. def getChild(self, name, request):
  294. if name == '':
  295. return self
  296. td = '.twistd'
  297. if name[-len(td):] == td:
  298. username = name[:-len(td)]
  299. sub = 1
  300. else:
  301. username = name
  302. sub = 0
  303. try:
  304. pw_name, pw_passwd, pw_uid, pw_gid, pw_gecos, pw_dir, pw_shell \
  305. = self._pwd.getpwnam(username)
  306. except KeyError:
  307. return resource.NoResource()
  308. if sub:
  309. twistdsock = os.path.join(pw_dir, self.userSocketName)
  310. rs = ResourceSubscription('unix',twistdsock)
  311. self.putChild(name, rs)
  312. return rs
  313. else:
  314. path = os.path.join(pw_dir, self.userDirName)
  315. if not os.path.exists(path):
  316. return resource.NoResource()
  317. return static.File(path)