You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

217 lines
5.4 KiB

12 years ago
12 years ago
12 years ago
12 years ago
12 years ago
12 years ago
  1. package storage
  2. import (
  3. "encoding/hex"
  4. "errors"
  5. "fmt"
  6. "io/ioutil"
  7. "mime"
  8. "net/http"
  9. "path"
  10. "strconv"
  11. "strings"
  12. "time"
  13. "github.com/chrislusf/seaweedfs/go/glog"
  14. "github.com/chrislusf/seaweedfs/go/images"
  15. "github.com/chrislusf/seaweedfs/go/util"
  16. )
  // Size constants for needles and the volumes that hold them.
  const (
  	// NeedleHeaderSize is the needle header size. It should never change.
  	NeedleHeaderSize = 16
  	// NeedlePaddingSize is the alignment unit used for needle padding.
  	NeedlePaddingSize = 8
  	// NeedleChecksumSize is the size of the stored needle checksum.
  	NeedleChecksumSize = 4
  	// MaxPossibleVolumeSize is 4GiB multiplied by 8, i.e. 32GiB.
  	MaxPossibleVolumeSize = 8 * (4 << 30)
  )
  23. /*
  24. * A Needle means a uploaded and stored file.
  25. * Needle file size is limited to 4GB for now.
  26. */
  27. type Needle struct {
  28. Cookie uint32 `comment:"random number to mitigate brute force lookups"`
  29. Id uint64 `comment:"needle id"`
  30. Size uint32 `comment:"sum of DataSize,Data,NameSize,Name,MimeSize,Mime"`
  31. DataSize uint32 `comment:"Data size"` //version2
  32. Data []byte `comment:"The actual file data"`
  33. Flags byte `comment:"boolean flags"` //version2
  34. NameSize uint8 //version2
  35. Name []byte `comment:"maximum 256 characters"` //version2
  36. MimeSize uint8 //version2
  37. Mime []byte `comment:"maximum 256 characters"` //version2
  38. LastModified uint64 //only store LastModifiedBytesLength bytes, which is 5 bytes to disk
  39. Ttl *TTL
  40. Checksum CRC `comment:"CRC32 to check integrity"`
  41. Padding []byte `comment:"Aligned to 8 bytes"`
  42. }
  43. func (n *Needle) String() (str string) {
  44. str = fmt.Sprintf("Cookie:%d, Id:%d, Size:%d, DataSize:%d, Name: %s, Mime: %s", n.Cookie, n.Id, n.Size, n.DataSize, n.Name, n.Mime)
  45. return
  46. }
  47. func ParseUpload(r *http.Request) (fileName string, data []byte, mimeType string, isGzipped bool, modifiedTime uint64, ttl *TTL, e error) {
  48. form, fe := r.MultipartReader()
  49. if fe != nil {
  50. glog.V(0).Infoln("MultipartReader [ERROR]", fe)
  51. e = fe
  52. return
  53. }
  54. //first multi-part item
  55. part, fe := form.NextPart()
  56. if fe != nil {
  57. glog.V(0).Infoln("Reading Multi part [ERROR]", fe)
  58. e = fe
  59. return
  60. }
  61. fileName = part.FileName()
  62. if fileName != "" {
  63. fileName = path.Base(fileName)
  64. }
  65. data, e = ioutil.ReadAll(part)
  66. if e != nil {
  67. glog.V(0).Infoln("Reading Content [ERROR]", e)
  68. return
  69. }
  70. //if the filename is empty string, do a search on the other multi-part items
  71. for fileName == "" {
  72. part2, fe := form.NextPart()
  73. if fe != nil {
  74. break // no more or on error, just safely break
  75. }
  76. fName := part2.FileName()
  77. //found the first <file type> multi-part has filename
  78. if fName != "" {
  79. data2, fe2 := ioutil.ReadAll(part2)
  80. if fe2 != nil {
  81. glog.V(0).Infoln("Reading Content [ERROR]", fe2)
  82. e = fe2
  83. return
  84. }
  85. //update
  86. data = data2
  87. fileName = path.Base(fName)
  88. break
  89. }
  90. }
  91. dotIndex := strings.LastIndex(fileName, ".")
  92. ext, mtype := "", ""
  93. if dotIndex > 0 {
  94. ext = strings.ToLower(fileName[dotIndex:])
  95. mtype = mime.TypeByExtension(ext)
  96. }
  97. contentType := part.Header.Get("Content-Type")
  98. if contentType != "" && mtype != contentType {
  99. mimeType = contentType //only return mime type if not deductable
  100. mtype = contentType
  101. }
  102. if part.Header.Get("Content-Encoding") == "gzip" {
  103. isGzipped = true
  104. } else if IsGzippable(ext, mtype) {
  105. if data, e = GzipData(data); e != nil {
  106. return
  107. }
  108. isGzipped = true
  109. }
  110. if ext == ".gz" {
  111. isGzipped = true
  112. }
  113. if strings.HasSuffix(fileName, ".gz") &&
  114. !strings.HasSuffix(fileName, ".tar.gz") {
  115. fileName = fileName[:len(fileName)-3]
  116. }
  117. modifiedTime, _ = strconv.ParseUint(r.FormValue("ts"), 10, 64)
  118. ttl, _ = ReadTTL(r.FormValue("ttl"))
  119. return
  120. }
  121. func NewNeedle(r *http.Request, fixJpgOrientation bool) (n *Needle, e error) {
  122. fname, mimeType, isGzipped := "", "", false
  123. n = new(Needle)
  124. fname, n.Data, mimeType, isGzipped, n.LastModified, n.Ttl, e = ParseUpload(r)
  125. if e != nil {
  126. return
  127. }
  128. if len(fname) < 256 {
  129. n.Name = []byte(fname)
  130. n.SetHasName()
  131. }
  132. if len(mimeType) < 256 {
  133. n.Mime = []byte(mimeType)
  134. n.SetHasMime()
  135. }
  136. if isGzipped {
  137. n.SetGzipped()
  138. }
  139. if n.LastModified == 0 {
  140. n.LastModified = uint64(time.Now().Unix())
  141. }
  142. n.SetHasLastModifiedDate()
  143. if n.Ttl != EMPTY_TTL {
  144. n.SetHasTtl()
  145. }
  146. if fixJpgOrientation {
  147. loweredName := strings.ToLower(fname)
  148. if mimeType == "image/jpeg" || strings.HasSuffix(loweredName, ".jpg") || strings.HasSuffix(loweredName, ".jpeg") {
  149. n.Data = images.FixJpgOrientation(n.Data)
  150. }
  151. }
  152. n.Checksum = NewCRC(n.Data)
  153. commaSep := strings.LastIndex(r.URL.Path, ",")
  154. dotSep := strings.LastIndex(r.URL.Path, ".")
  155. fid := r.URL.Path[commaSep+1:]
  156. if dotSep > 0 {
  157. fid = r.URL.Path[commaSep+1 : dotSep]
  158. }
  159. e = n.ParsePath(fid)
  160. return
  161. }
  162. func (n *Needle) ParsePath(fid string) (err error) {
  163. length := len(fid)
  164. if length <= 8 {
  165. return errors.New("Invalid fid:" + fid)
  166. }
  167. delta := ""
  168. deltaIndex := strings.LastIndex(fid, "_")
  169. if deltaIndex > 0 {
  170. fid, delta = fid[0:deltaIndex], fid[deltaIndex+1:]
  171. }
  172. n.Id, n.Cookie, err = ParseKeyHash(fid)
  173. if err != nil {
  174. return err
  175. }
  176. if delta != "" {
  177. if d, e := strconv.ParseUint(delta, 10, 64); e == nil {
  178. n.Id += d
  179. } else {
  180. return e
  181. }
  182. }
  183. return err
  184. }
  185. func ParseKeyHash(key_hash_string string) (uint64, uint32, error) {
  186. key_hash_bytes, khe := hex.DecodeString(key_hash_string)
  187. key_hash_len := len(key_hash_bytes)
  188. if khe != nil || key_hash_len <= 4 {
  189. glog.V(0).Infoln("Invalid key_hash", key_hash_string, "length:", key_hash_len, "error", khe)
  190. return 0, 0, errors.New("Invalid key and hash:" + key_hash_string)
  191. }
  192. key := util.BytesToUint64(key_hash_bytes[0 : key_hash_len-4])
  193. hash := util.BytesToUint32(key_hash_bytes[key_hash_len-4 : key_hash_len])
  194. return key, hash, nil
  195. }