github.com/xushiwei/go@v0.0.0-20130601165731-2b9d83f45bc9/src/pkg/net/http/cgi/host.go (about)

     1  // Copyright 2011 The Go Authors. All rights reserved.
     2  // Use of this source code is governed by a BSD-style
     3  // license that can be found in the LICENSE file.
     4  
     5  // This file implements the host side of CGI (being the webserver
     6  // parent process).
     7  
     8  // Package cgi implements CGI (Common Gateway Interface) as specified
     9  // in RFC 3875.
    10  //
    11  // Note that using CGI means starting a new process to handle each
    12  // request, which is typically less efficient than using a
    13  // long-running server.  This package is intended primarily for
    14  // compatibility with existing systems.
    15  package cgi
    16  
    17  import (
    18  	"bufio"
    19  	"fmt"
    20  	"io"
    21  	"log"
    22  	"net/http"
    23  	"os"
    24  	"os/exec"
    25  	"path/filepath"
    26  	"regexp"
    27  	"runtime"
    28  	"strconv"
    29  	"strings"
    30  )
    31  
    32  var trailingPort = regexp.MustCompile(`:([0-9]+)$`)
    33  
    34  var osDefaultInheritEnv = map[string][]string{
    35  	"darwin":  {"DYLD_LIBRARY_PATH"},
    36  	"freebsd": {"LD_LIBRARY_PATH"},
    37  	"hpux":    {"LD_LIBRARY_PATH", "SHLIB_PATH"},
    38  	"irix":    {"LD_LIBRARY_PATH", "LD_LIBRARYN32_PATH", "LD_LIBRARY64_PATH"},
    39  	"linux":   {"LD_LIBRARY_PATH"},
    40  	"openbsd": {"LD_LIBRARY_PATH"},
    41  	"solaris": {"LD_LIBRARY_PATH", "LD_LIBRARY_PATH_32", "LD_LIBRARY_PATH_64"},
    42  	"windows": {"SystemRoot", "COMSPEC", "PATHEXT", "WINDIR"},
    43  }
    44  
    45  // Handler runs an executable in a subprocess with a CGI environment.
    46  type Handler struct {
    47  	Path string // path to the CGI executable
    48  	Root string // root URI prefix of handler or empty for "/"
    49  
    50  	// Dir specifies the CGI executable's working directory.
    51  	// If Dir is empty, the base directory of Path is used.
    52  	// If Path has no base directory, the current working
    53  	// directory is used.
    54  	Dir string
    55  
    56  	Env        []string    // extra environment variables to set, if any, as "key=value"
    57  	InheritEnv []string    // environment variables to inherit from host, as "key"
    58  	Logger     *log.Logger // optional log for errors or nil to use log.Print
    59  	Args       []string    // optional arguments to pass to child process
    60  
    61  	// PathLocationHandler specifies the root http Handler that
    62  	// should handle internal redirects when the CGI process
    63  	// returns a Location header value starting with a "/", as
    64  	// specified in RFC 3875 ยง 6.3.2. This will likely be
    65  	// http.DefaultServeMux.
    66  	//
    67  	// If nil, a CGI response with a local URI path is instead sent
    68  	// back to the client and not redirected internally.
    69  	PathLocationHandler http.Handler
    70  }
    71  
    72  // removeLeadingDuplicates remove leading duplicate in environments.
    73  // It's possible to override environment like following.
    74  //    cgi.Handler{
    75  //      ...
    76  //      Env: []string{"SCRIPT_FILENAME=foo.php"},
    77  //    }
    78  func removeLeadingDuplicates(env []string) (ret []string) {
    79  	n := len(env)
    80  	for i := 0; i < n; i++ {
    81  		e := env[i]
    82  		s := strings.SplitN(e, "=", 2)[0]
    83  		found := false
    84  		for j := i + 1; j < n; j++ {
    85  			if s == strings.SplitN(env[j], "=", 2)[0] {
    86  				found = true
    87  				break
    88  			}
    89  		}
    90  		if !found {
    91  			ret = append(ret, e)
    92  		}
    93  	}
    94  	return
    95  }
    96  
    97  func (h *Handler) ServeHTTP(rw http.ResponseWriter, req *http.Request) {
    98  	root := h.Root
    99  	if root == "" {
   100  		root = "/"
   101  	}
   102  
   103  	if len(req.TransferEncoding) > 0 && req.TransferEncoding[0] == "chunked" {
   104  		rw.WriteHeader(http.StatusBadRequest)
   105  		rw.Write([]byte("Chunked request bodies are not supported by CGI."))
   106  		return
   107  	}
   108  
   109  	pathInfo := req.URL.Path
   110  	if root != "/" && strings.HasPrefix(pathInfo, root) {
   111  		pathInfo = pathInfo[len(root):]
   112  	}
   113  
   114  	port := "80"
   115  	if matches := trailingPort.FindStringSubmatch(req.Host); len(matches) != 0 {
   116  		port = matches[1]
   117  	}
   118  
   119  	env := []string{
   120  		"SERVER_SOFTWARE=go",
   121  		"SERVER_NAME=" + req.Host,
   122  		"SERVER_PROTOCOL=HTTP/1.1",
   123  		"HTTP_HOST=" + req.Host,
   124  		"GATEWAY_INTERFACE=CGI/1.1",
   125  		"REQUEST_METHOD=" + req.Method,
   126  		"QUERY_STRING=" + req.URL.RawQuery,
   127  		"REQUEST_URI=" + req.URL.RequestURI(),
   128  		"PATH_INFO=" + pathInfo,
   129  		"SCRIPT_NAME=" + root,
   130  		"SCRIPT_FILENAME=" + h.Path,
   131  		"REMOTE_ADDR=" + req.RemoteAddr,
   132  		"REMOTE_HOST=" + req.RemoteAddr,
   133  		"SERVER_PORT=" + port,
   134  	}
   135  
   136  	if req.TLS != nil {
   137  		env = append(env, "HTTPS=on")
   138  	}
   139  
   140  	for k, v := range req.Header {
   141  		k = strings.Map(upperCaseAndUnderscore, k)
   142  		joinStr := ", "
   143  		if k == "COOKIE" {
   144  			joinStr = "; "
   145  		}
   146  		env = append(env, "HTTP_"+k+"="+strings.Join(v, joinStr))
   147  	}
   148  
   149  	if req.ContentLength > 0 {
   150  		env = append(env, fmt.Sprintf("CONTENT_LENGTH=%d", req.ContentLength))
   151  	}
   152  	if ctype := req.Header.Get("Content-Type"); ctype != "" {
   153  		env = append(env, "CONTENT_TYPE="+ctype)
   154  	}
   155  
   156  	if h.Env != nil {
   157  		env = append(env, h.Env...)
   158  	}
   159  
   160  	envPath := os.Getenv("PATH")
   161  	if envPath == "" {
   162  		envPath = "/bin:/usr/bin:/usr/ucb:/usr/bsd:/usr/local/bin"
   163  	}
   164  	env = append(env, "PATH="+envPath)
   165  
   166  	for _, e := range h.InheritEnv {
   167  		if v := os.Getenv(e); v != "" {
   168  			env = append(env, e+"="+v)
   169  		}
   170  	}
   171  
   172  	for _, e := range osDefaultInheritEnv[runtime.GOOS] {
   173  		if v := os.Getenv(e); v != "" {
   174  			env = append(env, e+"="+v)
   175  		}
   176  	}
   177  
   178  	env = removeLeadingDuplicates(env)
   179  
   180  	var cwd, path string
   181  	if h.Dir != "" {
   182  		path = h.Path
   183  		cwd = h.Dir
   184  	} else {
   185  		cwd, path = filepath.Split(h.Path)
   186  	}
   187  	if cwd == "" {
   188  		cwd = "."
   189  	}
   190  
   191  	internalError := func(err error) {
   192  		rw.WriteHeader(http.StatusInternalServerError)
   193  		h.printf("CGI error: %v", err)
   194  	}
   195  
   196  	cmd := &exec.Cmd{
   197  		Path:   path,
   198  		Args:   append([]string{h.Path}, h.Args...),
   199  		Dir:    cwd,
   200  		Env:    env,
   201  		Stderr: os.Stderr, // for now
   202  	}
   203  	if req.ContentLength != 0 {
   204  		cmd.Stdin = req.Body
   205  	}
   206  	stdoutRead, err := cmd.StdoutPipe()
   207  	if err != nil {
   208  		internalError(err)
   209  		return
   210  	}
   211  
   212  	err = cmd.Start()
   213  	if err != nil {
   214  		internalError(err)
   215  		return
   216  	}
   217  	defer cmd.Wait()
   218  	defer stdoutRead.Close()
   219  
   220  	linebody := bufio.NewReaderSize(stdoutRead, 1024)
   221  	headers := make(http.Header)
   222  	statusCode := 0
   223  	for {
   224  		line, isPrefix, err := linebody.ReadLine()
   225  		if isPrefix {
   226  			rw.WriteHeader(http.StatusInternalServerError)
   227  			h.printf("cgi: long header line from subprocess.")
   228  			return
   229  		}
   230  		if err == io.EOF {
   231  			break
   232  		}
   233  		if err != nil {
   234  			rw.WriteHeader(http.StatusInternalServerError)
   235  			h.printf("cgi: error reading headers: %v", err)
   236  			return
   237  		}
   238  		if len(line) == 0 {
   239  			break
   240  		}
   241  		parts := strings.SplitN(string(line), ":", 2)
   242  		if len(parts) < 2 {
   243  			h.printf("cgi: bogus header line: %s", string(line))
   244  			continue
   245  		}
   246  		header, val := parts[0], parts[1]
   247  		header = strings.TrimSpace(header)
   248  		val = strings.TrimSpace(val)
   249  		switch {
   250  		case header == "Status":
   251  			if len(val) < 3 {
   252  				h.printf("cgi: bogus status (short): %q", val)
   253  				return
   254  			}
   255  			code, err := strconv.Atoi(val[0:3])
   256  			if err != nil {
   257  				h.printf("cgi: bogus status: %q", val)
   258  				h.printf("cgi: line was %q", line)
   259  				return
   260  			}
   261  			statusCode = code
   262  		default:
   263  			headers.Add(header, val)
   264  		}
   265  	}
   266  
   267  	if loc := headers.Get("Location"); loc != "" {
   268  		if strings.HasPrefix(loc, "/") && h.PathLocationHandler != nil {
   269  			h.handleInternalRedirect(rw, req, loc)
   270  			return
   271  		}
   272  		if statusCode == 0 {
   273  			statusCode = http.StatusFound
   274  		}
   275  	}
   276  
   277  	if statusCode == 0 {
   278  		statusCode = http.StatusOK
   279  	}
   280  
   281  	// Copy headers to rw's headers, after we've decided not to
   282  	// go into handleInternalRedirect, which won't want its rw
   283  	// headers to have been touched.
   284  	for k, vv := range headers {
   285  		for _, v := range vv {
   286  			rw.Header().Add(k, v)
   287  		}
   288  	}
   289  
   290  	rw.WriteHeader(statusCode)
   291  
   292  	_, err = io.Copy(rw, linebody)
   293  	if err != nil {
   294  		h.printf("cgi: copy error: %v", err)
   295  	}
   296  }
   297  
   298  func (h *Handler) printf(format string, v ...interface{}) {
   299  	if h.Logger != nil {
   300  		h.Logger.Printf(format, v...)
   301  	} else {
   302  		log.Printf(format, v...)
   303  	}
   304  }
   305  
   306  func (h *Handler) handleInternalRedirect(rw http.ResponseWriter, req *http.Request, path string) {
   307  	url, err := req.URL.Parse(path)
   308  	if err != nil {
   309  		rw.WriteHeader(http.StatusInternalServerError)
   310  		h.printf("cgi: error resolving local URI path %q: %v", path, err)
   311  		return
   312  	}
   313  	// TODO: RFC 3875 isn't clear if only GET is supported, but it
   314  	// suggests so: "Note that any message-body attached to the
   315  	// request (such as for a POST request) may not be available
   316  	// to the resource that is the target of the redirect."  We
   317  	// should do some tests against Apache to see how it handles
   318  	// POST, HEAD, etc. Does the internal redirect get the same
   319  	// method or just GET? What about incoming headers?
   320  	// (e.g. Cookies) Which headers, if any, are copied into the
   321  	// second request?
   322  	newReq := &http.Request{
   323  		Method:     "GET",
   324  		URL:        url,
   325  		Proto:      "HTTP/1.1",
   326  		ProtoMajor: 1,
   327  		ProtoMinor: 1,
   328  		Header:     make(http.Header),
   329  		Host:       url.Host,
   330  		RemoteAddr: req.RemoteAddr,
   331  		TLS:        req.TLS,
   332  	}
   333  	h.PathLocationHandler.ServeHTTP(rw, newReq)
   334  }
   335  
   336  func upperCaseAndUnderscore(r rune) rune {
   337  	switch {
   338  	case r >= 'a' && r <= 'z':
   339  		return r - ('a' - 'A')
   340  	case r == '-':
   341  		return '_'
   342  	case r == '=':
   343  		// Maybe not part of the CGI 'spec' but would mess up
   344  		// the environment in any case, as Go represents the
   345  		// environment as a slice of "key=value" strings.
   346  		return '_'
   347  	}
   348  	// TODO: other transformations in spec or practice?
   349  	return r
   350  }