home *** CD-ROM | disk | FTP | other *** search
- # Gopher protocol client interface
-
- import string
-
- # Default selector, host and port
- DEF_SELECTOR = '1/'
- DEF_HOST = 'gopher.micro.umn.edu'
- DEF_PORT = 70
-
- # Recognized file types
- A_TEXT = '0'
- A_MENU = '1'
- A_CSO = '2'
- A_ERROR = '3'
- A_MACBINHEX = '4'
- A_PCBINHEX = '5'
- A_UUENCODED = '6'
- A_INDEX = '7'
- A_TELNET = '8'
- A_BINARY = '9'
- A_DUPLICATE = '+'
- A_SOUND = 's'
- A_EVENT = 'e'
- A_CALENDAR = 'c'
- A_HTML = 'h'
- A_TN3270 = 'T'
- A_MIME = 'M'
- A_IMAGE = 'I'
- A_WHOIS = 'w'
- A_QUERY = 'q'
- A_GIF = 'g'
- A_HTML = 'h' # HTML file
- A_WWW = 'w' # WWW address
- A_PLUS_IMAGE = ':'
- A_PLUS_MOVIE = ';'
- A_PLUS_SOUND = '<'
-
-
- # Function mapping all file types to strings; unknown types become TYPE='x'
- _names = dir()
- _type_to_name_map = {}
- def type_to_name(gtype):
- global _type_to_name_map
- if _type_to_name_map=={}:
- for name in _names:
- if name[:2] == 'A_':
- _type_to_name_map[eval(name)] = name[2:]
- if _type_to_name_map.has_key(gtype):
- return _type_to_name_map[gtype]
- return 'TYPE=' + `gtype`
-
- # Names for characters and strings
- CRLF = '\r\n'
- TAB = '\t'
-
- # Send a selector to a given host and port, return a file with the reply
- def send_selector(selector, host, port = 0):
- import socket
- import string
- if not port:
- i = string.find(host, ':')
- if i >= 0:
- host, port = host[:i], string.atoi(host[i+1:])
- if not port:
- port = DEF_PORT
- elif type(port) == type(''):
- port = string.atoi(port)
- s = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
- s.connect(host, port)
- s.send(selector + CRLF)
- s.shutdown(1)
- return s.makefile('rb')
-
- # Send a selector and a query string
- def send_query(selector, query, host, port = 0):
- return send_selector(selector + '\t' + query, host, port)
-
- # Takes a path as returned by urlparse and returns the appropriate selector
- def path_to_selector(path):
- if path=="/":
- return "/"
- else:
- return path[2:] # Cuts initial slash and data type identifier
-
- # Takes a path as returned by urlparse and maps it to a string
- # See section 3.4 of RFC 1738 for details
- def path_to_datatype_name(path):
- if path=="/":
- # No way to tell, although "INDEX" is likely
- return "TYPE='unknown'"
- else:
- return type_to_name(path[1])
-
- # The following functions interpret the data returned by the gopher
- # server according to the expected type, e.g. textfile or directory
-
- # Get a directory in the form of a list of entries
- def get_directory(f):
- import string
- list = []
- while 1:
- line = f.readline()
- if not line:
- print '(Unexpected EOF from server)'
- break
- if line[-2:] == CRLF:
- line = line[:-2]
- elif line[-1:] in CRLF:
- line = line[:-1]
- if line == '.':
- break
- if not line:
- print '(Empty line from server)'
- continue
- gtype = line[0]
- parts = string.splitfields(line[1:], TAB)
- if len(parts) < 4:
- print '(Bad line from server:', `line`, ')'
- continue
- if len(parts) > 4:
- if parts[4:] != ['+']:
- print '(Extra info from server:',
- print parts[4:], ')'
- else:
- parts.append('')
- parts.insert(0, gtype)
- list.append(parts)
- return list
-
- # Get a text file as a list of lines, with trailing CRLF stripped
- def get_textfile(f):
- list = []
- get_alt_textfile(f, list.append)
- return list
-
- # Get a text file and pass each line to a function, with trailing CRLF stripped
- def get_alt_textfile(f, func):
- while 1:
- line = f.readline()
- if not line:
- print '(Unexpected EOF from server)'
- break
- if line[-2:] == CRLF:
- line = line[:-2]
- elif line[-1:] in CRLF:
- line = line[:-1]
- if line == '.':
- break
- if line[:2] == '..':
- line = line[1:]
- func(line)
-
- # Get a binary file as one solid data block
- def get_binary(f):
- data = f.read()
- return data
-
- # Get a binary file and pass each block to a function
- def get_alt_binary(f, func, blocksize):
- while 1:
- data = f.read(blocksize)
- if not data:
- break
- func(data)
-
- # Trivial test program
- def test():
- import sys
- import getopt
- opts, args = getopt.getopt(sys.argv[1:], '')
- selector = DEF_SELECTOR
- type = selector[0]
- host = DEF_HOST
- port = DEF_PORT
- if args:
- host = args[0]
- args = args[1:]
- if args:
- type = args[0]
- args = args[1:]
- if len(type) > 1:
- type, selector = type[0], type
- else:
- selector = ''
- if args:
- selector = args[0]
- args = args[1:]
- query = ''
- if args:
- query = args[0]
- args = args[1:]
- if type == A_INDEX:
- f = send_query(selector, query, host)
- else:
- f = send_selector(selector, host)
- if type == A_TEXT:
- list = get_textfile(f)
- for item in list: print item
- elif type in (A_MENU, A_INDEX):
- list = get_directory(f)
- for item in list: print item
- else:
- data = get_binary(f)
- print 'binary data:', len(data), 'bytes:', `data[:100]`[:40]
-
- # Run the test when run as script
- if __name__ == '__main__':
- test()
-