You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

556 lines
17 KiB

7 years ago
7 years ago
7 years ago
7 years ago
5 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
10 months ago
10 months ago
1 year ago
3 years ago
4 years ago
4 years ago
3 years ago
  1. package s3api
  2. import (
  3. "context"
  4. "encoding/xml"
  5. "fmt"
  6. "github.com/seaweedfs/seaweedfs/weed/glog"
  7. "github.com/seaweedfs/seaweedfs/weed/s3api/s3_constants"
  8. "io"
  9. "net/http"
  10. "net/url"
  11. "strconv"
  12. "strings"
  13. "time"
  14. "github.com/seaweedfs/seaweedfs/weed/filer"
  15. "github.com/seaweedfs/seaweedfs/weed/pb/filer_pb"
  16. "github.com/seaweedfs/seaweedfs/weed/s3api/s3err"
  17. )
  18. type ListBucketResultV2 struct {
  19. XMLName xml.Name `xml:"http://s3.amazonaws.com/doc/2006-03-01/ ListBucketResult"`
  20. Name string `xml:"Name"`
  21. Prefix string `xml:"Prefix"`
  22. MaxKeys int `xml:"MaxKeys"`
  23. Delimiter string `xml:"Delimiter,omitempty"`
  24. IsTruncated bool `xml:"IsTruncated"`
  25. Contents []ListEntry `xml:"Contents,omitempty"`
  26. CommonPrefixes []PrefixEntry `xml:"CommonPrefixes,omitempty"`
  27. ContinuationToken string `xml:"ContinuationToken,omitempty"`
  28. NextContinuationToken string `xml:"NextContinuationToken,omitempty"`
  29. KeyCount int `xml:"KeyCount"`
  30. StartAfter string `xml:"StartAfter,omitempty"`
  31. }
  32. func (s3a *S3ApiServer) ListObjectsV2Handler(w http.ResponseWriter, r *http.Request) {
  33. // https://docs.aws.amazon.com/AmazonS3/latest/API/v2-RESTBucketGET.html
  34. // collect parameters
  35. bucket, _ := s3_constants.GetBucketAndObject(r)
  36. glog.V(3).Infof("ListObjectsV2Handler %s", bucket)
  37. originalPrefix, continuationToken, startAfter, delimiter, _, maxKeys := getListObjectsV2Args(r.URL.Query())
  38. if maxKeys < 0 {
  39. s3err.WriteErrorResponse(w, r, s3err.ErrInvalidMaxKeys)
  40. return
  41. }
  42. marker := continuationToken
  43. if continuationToken == "" {
  44. marker = startAfter
  45. }
  46. response, err := s3a.listFilerEntries(bucket, originalPrefix, maxKeys, marker, delimiter)
  47. if err != nil {
  48. s3err.WriteErrorResponse(w, r, s3err.ErrInternalError)
  49. return
  50. }
  51. if len(response.Contents) == 0 {
  52. if exists, existErr := s3a.exists(s3a.option.BucketsPath, bucket, true); existErr == nil && !exists {
  53. s3err.WriteErrorResponse(w, r, s3err.ErrNoSuchBucket)
  54. return
  55. }
  56. }
  57. responseV2 := &ListBucketResultV2{
  58. XMLName: response.XMLName,
  59. Name: response.Name,
  60. CommonPrefixes: response.CommonPrefixes,
  61. Contents: response.Contents,
  62. ContinuationToken: continuationToken,
  63. Delimiter: response.Delimiter,
  64. IsTruncated: response.IsTruncated,
  65. KeyCount: len(response.Contents) + len(response.CommonPrefixes),
  66. MaxKeys: response.MaxKeys,
  67. NextContinuationToken: response.NextMarker,
  68. Prefix: response.Prefix,
  69. StartAfter: startAfter,
  70. }
  71. writeSuccessResponseXML(w, r, responseV2)
  72. }
  73. func (s3a *S3ApiServer) ListObjectsV1Handler(w http.ResponseWriter, r *http.Request) {
  74. // https://docs.aws.amazon.com/AmazonS3/latest/API/RESTBucketGET.html
  75. // collect parameters
  76. bucket, _ := s3_constants.GetBucketAndObject(r)
  77. glog.V(3).Infof("ListObjectsV1Handler %s", bucket)
  78. originalPrefix, marker, delimiter, maxKeys := getListObjectsV1Args(r.URL.Query())
  79. if maxKeys < 0 {
  80. s3err.WriteErrorResponse(w, r, s3err.ErrInvalidMaxKeys)
  81. return
  82. }
  83. response, err := s3a.listFilerEntries(bucket, originalPrefix, maxKeys, marker, delimiter)
  84. if err != nil {
  85. s3err.WriteErrorResponse(w, r, s3err.ErrInternalError)
  86. return
  87. }
  88. if len(response.Contents) == 0 {
  89. if exists, existErr := s3a.exists(s3a.option.BucketsPath, bucket, true); existErr == nil && !exists {
  90. s3err.WriteErrorResponse(w, r, s3err.ErrNoSuchBucket)
  91. return
  92. }
  93. }
  94. writeSuccessResponseXML(w, r, response)
  95. }
  96. func (s3a *S3ApiServer) listFilerEntries(bucket string, originalPrefix string, maxKeys int, originalMarker string, delimiter string) (response ListBucketResult, err error) {
  97. // convert full path prefix into directory name and prefix for entry name
  98. requestDir, prefix, marker := normalizePrefixMarker(originalPrefix, originalMarker)
  99. bucketPrefix := fmt.Sprintf("%s/%s/", s3a.option.BucketsPath, bucket)
  100. reqDir := bucketPrefix[:len(bucketPrefix)-1]
  101. if requestDir != "" {
  102. reqDir = fmt.Sprintf("%s%s", bucketPrefix, requestDir)
  103. }
  104. var contents []ListEntry
  105. var commonPrefixes []PrefixEntry
  106. var doErr error
  107. var nextMarker string
  108. cursor := &ListingCursor{
  109. maxKeys: maxKeys,
  110. prefixEndsOnDelimiter: strings.HasSuffix(originalPrefix, "/") && len(originalMarker) == 0,
  111. }
  112. if s3a.option.AllowListRecursive {
  113. err = s3a.WithFilerClient(false, func(client filer_pb.SeaweedFilerClient) error {
  114. return nil
  115. })
  116. return
  117. }
  118. // check filer
  119. err = s3a.WithFilerClient(false, func(client filer_pb.SeaweedFilerClient) error {
  120. for {
  121. empty := true
  122. nextMarker, doErr = s3a.doListFilerEntries(client, reqDir, prefix, cursor, marker, delimiter, false, func(dir string, entry *filer_pb.Entry) {
  123. empty = false
  124. if entry.IsDirectory {
  125. if entry.IsDirectoryKeyObject() {
  126. contents = append(contents, ListEntry{
  127. Key: fmt.Sprintf("%s/%s/", dir, entry.Name)[len(bucketPrefix):],
  128. LastModified: time.Unix(entry.Attributes.Mtime, 0).UTC(),
  129. ETag: "\"" + filer.ETag(entry) + "\"",
  130. Owner: CanonicalUser{
  131. ID: fmt.Sprintf("%x", entry.Attributes.Uid),
  132. DisplayName: entry.Attributes.UserName,
  133. },
  134. StorageClass: "STANDARD",
  135. })
  136. cursor.maxKeys--
  137. // https://docs.aws.amazon.com/AmazonS3/latest/API/API_ListObjectsV2.html
  138. } else if delimiter == "/" { // A response can contain CommonPrefixes only if you specify a delimiter.
  139. commonPrefixes = append(commonPrefixes, PrefixEntry{
  140. Prefix: fmt.Sprintf("%s/%s/", dir, entry.Name)[len(bucketPrefix):],
  141. })
  142. //All of the keys (up to 1,000) rolled up into a common prefix count as a single return when calculating the number of returns.
  143. cursor.maxKeys--
  144. }
  145. } else {
  146. var delimiterFound bool
  147. if delimiter != "" {
  148. // keys that contain the same string between the prefix and the first occurrence of the delimiter are grouped together as a commonPrefix.
  149. // extract the string between the prefix and the delimiter and add it to the commonPrefixes if it's unique.
  150. undelimitedPath := fmt.Sprintf("%s/%s", dir, entry.Name)[len(bucketPrefix):]
  151. // take into account a prefix if supplied while delimiting.
  152. undelimitedPath = strings.TrimPrefix(undelimitedPath, originalPrefix)
  153. delimitedPath := strings.SplitN(undelimitedPath, delimiter, 2)
  154. if len(delimitedPath) == 2 {
  155. // S3 clients expect the delimited prefix to contain the delimiter and prefix.
  156. delimitedPrefix := originalPrefix + delimitedPath[0] + delimiter
  157. for i := range commonPrefixes {
  158. if commonPrefixes[i].Prefix == delimitedPrefix {
  159. delimiterFound = true
  160. break
  161. }
  162. }
  163. if !delimiterFound {
  164. commonPrefixes = append(commonPrefixes, PrefixEntry{
  165. Prefix: delimitedPrefix,
  166. })
  167. cursor.maxKeys--
  168. delimiterFound = true
  169. }
  170. }
  171. }
  172. if !delimiterFound {
  173. storageClass := "STANDARD"
  174. if v, ok := entry.Extended[s3_constants.AmzStorageClass]; ok {
  175. storageClass = string(v)
  176. }
  177. contents = append(contents, ListEntry{
  178. Key: fmt.Sprintf("%s/%s", dir, entry.Name)[len(bucketPrefix):],
  179. LastModified: time.Unix(entry.Attributes.Mtime, 0).UTC(),
  180. ETag: "\"" + filer.ETag(entry) + "\"",
  181. Size: int64(filer.FileSize(entry)),
  182. Owner: CanonicalUser{
  183. ID: fmt.Sprintf("%x", entry.Attributes.Uid),
  184. DisplayName: entry.Attributes.UserName,
  185. },
  186. StorageClass: StorageClass(storageClass),
  187. })
  188. cursor.maxKeys--
  189. }
  190. }
  191. })
  192. if doErr != nil {
  193. return doErr
  194. }
  195. if cursor.isTruncated {
  196. if requestDir != "" {
  197. nextMarker = requestDir + "/" + nextMarker
  198. }
  199. break
  200. } else if empty || strings.HasSuffix(originalPrefix, "/") {
  201. nextMarker = ""
  202. break
  203. } else {
  204. // start next loop
  205. marker = nextMarker
  206. }
  207. }
  208. response = ListBucketResult{
  209. Name: bucket,
  210. Prefix: originalPrefix,
  211. Marker: originalMarker,
  212. NextMarker: nextMarker,
  213. MaxKeys: maxKeys,
  214. Delimiter: delimiter,
  215. IsTruncated: cursor.isTruncated,
  216. Contents: contents,
  217. CommonPrefixes: commonPrefixes,
  218. }
  219. return nil
  220. })
  221. return
  222. }
  // ListingCursor carries the mutable state shared by one listing request
  // across the recursive calls of doListFilerEntries.
  type ListingCursor struct {
  	// maxKeys is the number of results that may still be reported; the
  	// listing callback decrements it for every key or common prefix.
  	maxKeys int
  	// isTruncated is set once further entries arrive after maxKeys has been
  	// used up.
  	isTruncated bool
  	// prefixEndsOnDelimiter starts out true when the requested prefix ends
  	// with "/" and no marker was given.
  	prefixEndsOnDelimiter bool
  }
  228. // the prefix and marker may be in different directories
  229. // normalizePrefixMarker ensures the prefix and marker both starts from the same directory
  230. func normalizePrefixMarker(prefix, marker string) (alignedDir, alignedPrefix, alignedMarker string) {
  231. // alignedDir should not end with "/"
  232. // alignedDir, alignedPrefix, alignedMarker should only have "/" in middle
  233. if len(marker) == 0 {
  234. prefix = strings.Trim(prefix, "/")
  235. } else {
  236. prefix = strings.TrimLeft(prefix, "/")
  237. }
  238. marker = strings.TrimLeft(marker, "/")
  239. if prefix == "" {
  240. return "", "", marker
  241. }
  242. if marker == "" {
  243. alignedDir, alignedPrefix = toDirAndName(prefix)
  244. return
  245. }
  246. if !strings.HasPrefix(marker, prefix) {
  247. // something wrong
  248. return "", prefix, marker
  249. }
  250. if strings.HasPrefix(marker, prefix+"/") {
  251. alignedDir = prefix
  252. alignedPrefix = ""
  253. alignedMarker = marker[len(alignedDir)+1:]
  254. return
  255. }
  256. alignedDir, alignedPrefix = toDirAndName(prefix)
  257. if alignedDir != "" {
  258. alignedMarker = marker[len(alignedDir)+1:]
  259. } else {
  260. alignedMarker = marker
  261. }
  262. return
  263. }
  // toDirAndName splits dirAndName at its last "/" into the directory part
  // and the final name. Without any "/" the whole input is the name and dir
  // is empty.
  func toDirAndName(dirAndName string) (dir, name string) {
  	lastSlash := strings.LastIndexByte(dirAndName, '/')
  	if lastSlash < 0 {
  		return "", dirAndName
  	}
  	return dirAndName[:lastSlash], dirAndName[lastSlash+1:]
  }
  // toParentAndDescendants splits dirAndName at its first "/" into the
  // top-level directory and everything below it. Without any "/" the whole
  // input is returned as name and dir is empty.
  func toParentAndDescendants(dirAndName string) (dir, name string) {
  	firstSlash := strings.IndexByte(dirAndName, '/')
  	if firstSlash < 0 {
  		return "", dirAndName
  	}
  	return dirAndName[:firstSlash], dirAndName[firstSlash+1:]
  }
  282. func (s3a *S3ApiServer) doListFilerRecursiveEntries(client filer_pb.SeaweedFilerClient, dir, prefix string, cursor *ListingCursor, marker, delimiter string, inclusiveStartFrom bool, eachEntryFn func(dir string, entry *filer_pb.Entry)) (nextMarker string, err error) {
  283. if prefix == "/" && delimiter == "/" {
  284. return
  285. }
  286. request := &filer_pb.ListEntriesRequest{
  287. Directory: dir,
  288. Prefix: prefix,
  289. Limit: uint32(cursor.maxKeys + 2),
  290. StartFromFileName: marker,
  291. InclusiveStartFrom: inclusiveStartFrom,
  292. Recursive: true,
  293. }
  294. ctx, cancel := context.WithCancel(context.Background())
  295. defer cancel()
  296. stream, listErr := client.ListEntries(ctx, request)
  297. if listErr != nil {
  298. return "", fmt.Errorf("list entires %+v: %v", request, listErr)
  299. }
  300. for {
  301. resp, recvErr := stream.Recv()
  302. if recvErr != nil {
  303. if recvErr == io.EOF {
  304. break
  305. } else {
  306. return "", fmt.Errorf("iterating entires %+v: %v", request, recvErr)
  307. }
  308. }
  309. eachEntryFn(dir, resp.Entry)
  310. }
  311. return
  312. }
  313. func (s3a *S3ApiServer) doListFilerEntries(client filer_pb.SeaweedFilerClient, dir, prefix string, cursor *ListingCursor, marker, delimiter string, inclusiveStartFrom bool, eachEntryFn func(dir string, entry *filer_pb.Entry)) (nextMarker string, err error) {
  314. // invariants
  315. // prefix and marker should be under dir, marker may contain "/"
  316. // maxKeys should be updated for each recursion
  317. // glog.V(4).Infof("doListFilerEntries dir: %s, prefix: %s, marker %s, maxKeys: %d, prefixEndsOnDelimiter: %+v", dir, prefix, marker, cursor.maxKeys, cursor.prefixEndsOnDelimiter)
  318. if prefix == "/" && delimiter == "/" {
  319. return
  320. }
  321. if cursor.maxKeys <= 0 {
  322. return
  323. }
  324. if strings.Contains(marker, "/") {
  325. subDir, subMarker := toParentAndDescendants(marker)
  326. // println("doListFilerEntries dir", dir+"/"+subDir, "subMarker", subMarker)
  327. subNextMarker, subErr := s3a.doListFilerEntries(client, dir+"/"+subDir, "", cursor, subMarker, delimiter, false, eachEntryFn)
  328. if subErr != nil {
  329. err = subErr
  330. return
  331. }
  332. nextMarker = subDir + "/" + subNextMarker
  333. // finished processing this subdirectory
  334. marker = subDir
  335. }
  336. if cursor.isTruncated {
  337. return
  338. }
  339. // now marker is also a direct child of dir
  340. request := &filer_pb.ListEntriesRequest{
  341. Directory: dir,
  342. Prefix: prefix,
  343. Limit: uint32(cursor.maxKeys + 2), // bucket root directory needs to skip additional s3_constants.MultipartUploadsFolder folder
  344. StartFromFileName: marker,
  345. InclusiveStartFrom: inclusiveStartFrom,
  346. }
  347. if cursor.prefixEndsOnDelimiter {
  348. request.Limit = uint32(1)
  349. }
  350. ctx, cancel := context.WithCancel(context.Background())
  351. defer cancel()
  352. stream, listErr := client.ListEntries(ctx, request)
  353. if listErr != nil {
  354. err = fmt.Errorf("list entires %+v: %v", request, listErr)
  355. return
  356. }
  357. for {
  358. resp, recvErr := stream.Recv()
  359. if recvErr != nil {
  360. if recvErr == io.EOF {
  361. break
  362. } else {
  363. err = fmt.Errorf("iterating entires %+v: %v", request, recvErr)
  364. return
  365. }
  366. }
  367. if cursor.maxKeys <= 0 {
  368. cursor.isTruncated = true
  369. continue
  370. }
  371. entry := resp.Entry
  372. nextMarker = entry.Name
  373. if cursor.prefixEndsOnDelimiter {
  374. if entry.Name == prefix && entry.IsDirectory {
  375. if delimiter != "/" {
  376. cursor.prefixEndsOnDelimiter = false
  377. }
  378. } else {
  379. continue
  380. }
  381. }
  382. if entry.IsDirectory {
  383. // glog.V(4).Infof("List Dir Entries %s, file: %s, maxKeys %d", dir, entry.Name, cursor.maxKeys)
  384. if entry.Name == s3_constants.MultipartUploadsFolder { // FIXME no need to apply to all directories. this extra also affects maxKeys
  385. continue
  386. }
  387. if delimiter != "/" || cursor.prefixEndsOnDelimiter {
  388. if cursor.prefixEndsOnDelimiter {
  389. cursor.prefixEndsOnDelimiter = false
  390. if entry.IsDirectoryKeyObject() {
  391. eachEntryFn(dir, entry)
  392. }
  393. } else {
  394. eachEntryFn(dir, entry)
  395. }
  396. subNextMarker, subErr := s3a.doListFilerEntries(client, dir+"/"+entry.Name, "", cursor, "", delimiter, false, eachEntryFn)
  397. if subErr != nil {
  398. err = fmt.Errorf("doListFilerEntries2: %v", subErr)
  399. return
  400. }
  401. // println("doListFilerEntries2 dir", dir+"/"+entry.Name, "subNextMarker", subNextMarker)
  402. nextMarker = entry.Name + "/" + subNextMarker
  403. if cursor.isTruncated {
  404. return
  405. }
  406. // println("doListFilerEntries2 nextMarker", nextMarker)
  407. } else {
  408. var isEmpty bool
  409. if !s3a.option.AllowEmptyFolder && entry.IsOlderDir() {
  410. //if isEmpty, err = s3a.ensureDirectoryAllEmpty(client, dir, entry.Name); err != nil {
  411. // glog.Errorf("check empty folder %s: %v", dir, err)
  412. //}
  413. }
  414. if !isEmpty {
  415. eachEntryFn(dir, entry)
  416. }
  417. }
  418. } else {
  419. eachEntryFn(dir, entry)
  420. // glog.V(4).Infof("List File Entries %s, file: %s, maxKeys %d", dir, entry.Name, cursor.maxKeys)
  421. }
  422. if cursor.prefixEndsOnDelimiter {
  423. cursor.prefixEndsOnDelimiter = false
  424. }
  425. }
  426. return
  427. }
  428. func getListObjectsV2Args(values url.Values) (prefix, token, startAfter, delimiter string, fetchOwner bool, maxkeys int) {
  429. prefix = values.Get("prefix")
  430. token = values.Get("continuation-token")
  431. startAfter = values.Get("start-after")
  432. delimiter = values.Get("delimiter")
  433. if values.Get("max-keys") != "" {
  434. maxkeys, _ = strconv.Atoi(values.Get("max-keys"))
  435. } else {
  436. maxkeys = maxObjectListSizeLimit
  437. }
  438. fetchOwner = values.Get("fetch-owner") == "true"
  439. return
  440. }
  441. func getListObjectsV1Args(values url.Values) (prefix, marker, delimiter string, maxkeys int) {
  442. prefix = values.Get("prefix")
  443. marker = values.Get("marker")
  444. delimiter = values.Get("delimiter")
  445. if values.Get("max-keys") != "" {
  446. maxkeys, _ = strconv.Atoi(values.Get("max-keys"))
  447. } else {
  448. maxkeys = maxObjectListSizeLimit
  449. }
  450. return
  451. }
  452. func (s3a *S3ApiServer) ensureDirectoryAllEmpty(filerClient filer_pb.SeaweedFilerClient, parentDir, name string) (isEmpty bool, err error) {
  453. // println("+ ensureDirectoryAllEmpty", dir, name)
  454. glog.V(4).Infof("+ isEmpty %s/%s", parentDir, name)
  455. defer glog.V(4).Infof("- isEmpty %s/%s %v", parentDir, name, isEmpty)
  456. var fileCounter int
  457. var subDirs []string
  458. currentDir := parentDir + "/" + name
  459. var startFrom string
  460. var isExhausted bool
  461. var foundEntry bool
  462. for fileCounter == 0 && !isExhausted && err == nil {
  463. err = filer_pb.SeaweedList(filerClient, currentDir, "", func(entry *filer_pb.Entry, isLast bool) error {
  464. foundEntry = true
  465. if entry.IsOlderDir() {
  466. subDirs = append(subDirs, entry.Name)
  467. } else {
  468. fileCounter++
  469. }
  470. startFrom = entry.Name
  471. isExhausted = isExhausted || isLast
  472. glog.V(4).Infof(" * %s/%s isLast: %t", currentDir, startFrom, isLast)
  473. return nil
  474. }, startFrom, false, 8)
  475. if !foundEntry {
  476. break
  477. }
  478. }
  479. if err != nil {
  480. return false, err
  481. }
  482. if fileCounter > 0 {
  483. return false, nil
  484. }
  485. for _, subDir := range subDirs {
  486. isSubEmpty, subErr := s3a.ensureDirectoryAllEmpty(filerClient, currentDir, subDir)
  487. if subErr != nil {
  488. return false, subErr
  489. }
  490. if !isSubEmpty {
  491. return false, nil
  492. }
  493. }
  494. glog.V(1).Infof("deleting empty folder %s", currentDir)
  495. if err = doDeleteEntry(filerClient, parentDir, name, true, false); err != nil {
  496. return
  497. }
  498. return true, nil
  499. }