You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

586 lines
18 KiB

7 years ago
7 years ago
7 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
9 months ago
9 months ago
9 months ago
9 months ago
1 year ago
3 years ago
4 years ago
4 years ago
3 years ago
  1. package s3api
  2. import (
  3. "context"
  4. "encoding/xml"
  5. "fmt"
  6. "github.com/aws/aws-sdk-go/service/s3"
  7. "github.com/seaweedfs/seaweedfs/weed/glog"
  8. "github.com/seaweedfs/seaweedfs/weed/pb/filer_pb"
  9. "github.com/seaweedfs/seaweedfs/weed/s3api/s3_constants"
  10. "github.com/seaweedfs/seaweedfs/weed/s3api/s3err"
  11. "io"
  12. "net/http"
  13. "net/url"
  14. "sort"
  15. "strconv"
  16. "strings"
  17. )
  18. type OptionalString struct {
  19. string
  20. set bool
  21. }
  22. func (o OptionalString) MarshalXML(e *xml.Encoder, startElement xml.StartElement) error {
  23. if !o.set {
  24. return nil
  25. }
  26. return e.EncodeElement(o.string, startElement)
  27. }
  28. type ListBucketResultV2 struct {
  29. XMLName xml.Name `xml:"http://s3.amazonaws.com/doc/2006-03-01/ ListBucketResult"`
  30. Name string `xml:"Name"`
  31. Prefix string `xml:"Prefix"`
  32. MaxKeys int `xml:"MaxKeys"`
  33. Delimiter string `xml:"Delimiter,omitempty"`
  34. IsTruncated bool `xml:"IsTruncated"`
  35. Contents []ListEntry `xml:"Contents,omitempty"`
  36. CommonPrefixes []PrefixEntry `xml:"CommonPrefixes,omitempty"`
  37. ContinuationToken OptionalString `xml:"ContinuationToken,omitempty"`
  38. NextContinuationToken string `xml:"NextContinuationToken,omitempty"`
  39. EncodingType string `xml:"EncodingType,omitempty"`
  40. KeyCount int `xml:"KeyCount"`
  41. StartAfter string `xml:"StartAfter,omitempty"`
  42. }
  43. func (s3a *S3ApiServer) ListObjectsV2Handler(w http.ResponseWriter, r *http.Request) {
  44. // https://docs.aws.amazon.com/AmazonS3/latest/API/v2-RESTBucketGET.html
  45. // collect parameters
  46. bucket, _ := s3_constants.GetBucketAndObject(r)
  47. glog.V(3).Infof("ListObjectsV2Handler %s", bucket)
  48. originalPrefix, startAfter, delimiter, continuationToken, encodingTypeUrl, fetchOwner, maxKeys := getListObjectsV2Args(r.URL.Query())
  49. if maxKeys < 0 {
  50. s3err.WriteErrorResponse(w, r, s3err.ErrInvalidMaxKeys)
  51. return
  52. }
  53. marker := continuationToken.string
  54. if !continuationToken.set {
  55. marker = startAfter
  56. }
  57. response, err := s3a.listFilerEntries(bucket, originalPrefix, maxKeys, marker, delimiter, encodingTypeUrl, fetchOwner)
  58. if err != nil {
  59. s3err.WriteErrorResponse(w, r, s3err.ErrInternalError)
  60. return
  61. }
  62. if len(response.Contents) == 0 {
  63. if exists, existErr := s3a.exists(s3a.option.BucketsPath, bucket, true); existErr == nil && !exists {
  64. s3err.WriteErrorResponse(w, r, s3err.ErrNoSuchBucket)
  65. return
  66. }
  67. }
  68. responseV2 := &ListBucketResultV2{
  69. XMLName: response.XMLName,
  70. Name: response.Name,
  71. CommonPrefixes: response.CommonPrefixes,
  72. Contents: response.Contents,
  73. ContinuationToken: continuationToken,
  74. Delimiter: response.Delimiter,
  75. IsTruncated: response.IsTruncated,
  76. KeyCount: len(response.Contents) + len(response.CommonPrefixes),
  77. MaxKeys: response.MaxKeys,
  78. NextContinuationToken: response.NextMarker,
  79. Prefix: response.Prefix,
  80. StartAfter: startAfter,
  81. }
  82. if encodingTypeUrl {
  83. responseV2.EncodingType = s3.EncodingTypeUrl
  84. }
  85. writeSuccessResponseXML(w, r, responseV2)
  86. }
  87. func (s3a *S3ApiServer) ListObjectsV1Handler(w http.ResponseWriter, r *http.Request) {
  88. // https://docs.aws.amazon.com/AmazonS3/latest/API/RESTBucketGET.html
  89. // collect parameters
  90. bucket, _ := s3_constants.GetBucketAndObject(r)
  91. glog.V(3).Infof("ListObjectsV1Handler %s", bucket)
  92. originalPrefix, marker, delimiter, encodingTypeUrl, maxKeys := getListObjectsV1Args(r.URL.Query())
  93. if maxKeys < 0 {
  94. s3err.WriteErrorResponse(w, r, s3err.ErrInvalidMaxKeys)
  95. return
  96. }
  97. response, err := s3a.listFilerEntries(bucket, originalPrefix, maxKeys, marker, delimiter, encodingTypeUrl, true)
  98. if err != nil {
  99. s3err.WriteErrorResponse(w, r, s3err.ErrInternalError)
  100. return
  101. }
  102. if len(response.Contents) == 0 {
  103. if exists, existErr := s3a.exists(s3a.option.BucketsPath, bucket, true); existErr == nil && !exists {
  104. s3err.WriteErrorResponse(w, r, s3err.ErrNoSuchBucket)
  105. return
  106. }
  107. }
  108. writeSuccessResponseXML(w, r, response)
  109. }
  110. func (s3a *S3ApiServer) listFilerEntries(bucket string, originalPrefix string, maxKeys int, originalMarker string, delimiter string, encodingTypeUrl bool, fetchOwner bool) (response ListBucketResult, err error) {
  111. // convert full path prefix into directory name and prefix for entry name
  112. requestDir, prefix, marker := normalizePrefixMarker(originalPrefix, originalMarker)
  113. bucketPrefix := fmt.Sprintf("%s/%s/", s3a.option.BucketsPath, bucket)
  114. reqDir := bucketPrefix[:len(bucketPrefix)-1]
  115. if requestDir != "" {
  116. reqDir = fmt.Sprintf("%s%s", bucketPrefix, requestDir)
  117. }
  118. var contents []ListEntry
  119. var commonPrefixes []PrefixEntry
  120. var doErr error
  121. var nextMarker string
  122. cursor := &ListingCursor{
  123. maxKeys: maxKeys,
  124. prefixEndsOnDelimiter: strings.HasSuffix(originalPrefix, "/") && len(originalMarker) == 0,
  125. }
  126. // Todo remove force disable
  127. if s3a.option.AllowListRecursive && prefix == "force_disable" {
  128. err = s3a.WithFilerClient(false, func(client filer_pb.SeaweedFilerClient) error {
  129. glog.V(0).Infof("doListFilerRecursiveEntries reqDir: %s, prefix: %s, delimiter: %s, cursor: %+v", reqDir, prefix, delimiter, cursor)
  130. nextMarker, doErr = s3a.doListFilerRecursiveEntries(client, reqDir, prefix, cursor, marker, delimiter, false,
  131. func(dir string, entry *filer_pb.Entry) {
  132. dirName, entryName, prefixName := entryUrlEncode(dir, entry.Name, encodingTypeUrl)
  133. if entry.IsDirectory {
  134. if delimiter == "/" { // A response can contain CommonPrefixes only if you specify a delimiter.
  135. commonPrefixes = append(commonPrefixes, PrefixEntry{
  136. Prefix: fmt.Sprintf("%s/%s/", dirName, prefixName)[len(bucketPrefix):],
  137. })
  138. }
  139. return
  140. }
  141. contents = append(contents, newListEntry(entry, dirName, entryName, bucketPrefix, fetchOwner, entry.IsDirectoryKeyObject()))
  142. cursor.maxKeys--
  143. },
  144. )
  145. return nil
  146. })
  147. response = ListBucketResult{
  148. Name: bucket,
  149. Prefix: originalPrefix,
  150. Marker: originalMarker,
  151. NextMarker: nextMarker,
  152. MaxKeys: maxKeys,
  153. Delimiter: delimiter,
  154. IsTruncated: cursor.isTruncated,
  155. Contents: contents,
  156. CommonPrefixes: commonPrefixes,
  157. }
  158. if encodingTypeUrl {
  159. response.EncodingType = s3.EncodingTypeUrl
  160. }
  161. return
  162. }
  163. // check filer
  164. err = s3a.WithFilerClient(false, func(client filer_pb.SeaweedFilerClient) error {
  165. for {
  166. empty := true
  167. nextMarker, doErr = s3a.doListFilerEntries(client, reqDir, prefix, cursor, marker, delimiter, false, func(dir string, entry *filer_pb.Entry) {
  168. empty = false
  169. glog.V(5).Infof("doListFilerEntries dir: %s entry: %+v", dir, entry)
  170. dirName, entryName, prefixName := entryUrlEncode(dir, entry.Name, encodingTypeUrl)
  171. if entry.IsDirectory {
  172. if entry.IsDirectoryKeyObject() {
  173. contents = append(contents, newListEntry(entry, dirName, entryName, bucketPrefix, fetchOwner, true))
  174. cursor.maxKeys--
  175. // https://docs.aws.amazon.com/AmazonS3/latest/API/API_ListObjectsV2.html
  176. } else if delimiter == "/" { // A response can contain CommonPrefixes only if you specify a delimiter.
  177. commonPrefixes = append(commonPrefixes, PrefixEntry{
  178. Prefix: fmt.Sprintf("%s/%s/", dirName, prefixName)[len(bucketPrefix):],
  179. })
  180. //All of the keys (up to 1,000) rolled up into a common prefix count as a single return when calculating the number of returns.
  181. cursor.maxKeys--
  182. }
  183. } else {
  184. var delimiterFound bool
  185. if delimiter != "" {
  186. // keys that contain the same string between the prefix and the first occurrence of the delimiter are grouped together as a commonPrefix.
  187. // extract the string between the prefix and the delimiter and add it to the commonPrefixes if it's unique.
  188. undelimitedPath := fmt.Sprintf("%s/%s", dir, entry.Name)[len(bucketPrefix):]
  189. // take into account a prefix if supplied while delimiting.
  190. undelimitedPath = strings.TrimPrefix(undelimitedPath, originalPrefix)
  191. delimitedPath := strings.SplitN(undelimitedPath, delimiter, 2)
  192. if len(delimitedPath) == 2 {
  193. // S3 clients expect the delimited prefix to contain the delimiter and prefix.
  194. delimitedPrefix := originalPrefix + delimitedPath[0] + delimiter
  195. for i := range commonPrefixes {
  196. if commonPrefixes[i].Prefix == delimitedPrefix {
  197. delimiterFound = true
  198. break
  199. }
  200. }
  201. if !delimiterFound {
  202. commonPrefixes = append(commonPrefixes, PrefixEntry{
  203. Prefix: delimitedPrefix,
  204. })
  205. cursor.maxKeys--
  206. delimiterFound = true
  207. }
  208. }
  209. }
  210. if !delimiterFound {
  211. contents = append(contents, newListEntry(entry, dirName, entryName, bucketPrefix, fetchOwner, false))
  212. cursor.maxKeys--
  213. }
  214. }
  215. })
  216. if doErr != nil {
  217. return doErr
  218. }
  219. if cursor.isTruncated {
  220. if requestDir != "" {
  221. nextMarker = requestDir + "/" + nextMarker
  222. }
  223. break
  224. } else if empty || strings.HasSuffix(originalPrefix, "/") {
  225. nextMarker = ""
  226. break
  227. } else {
  228. // start next loop
  229. marker = nextMarker
  230. }
  231. }
  232. response = ListBucketResult{
  233. Name: bucket,
  234. Prefix: originalPrefix,
  235. Marker: originalMarker,
  236. NextMarker: nextMarker,
  237. MaxKeys: maxKeys,
  238. Delimiter: delimiter,
  239. IsTruncated: cursor.isTruncated,
  240. Contents: contents,
  241. CommonPrefixes: commonPrefixes,
  242. }
  243. if encodingTypeUrl {
  244. sort.Slice(response.CommonPrefixes, func(i, j int) bool {
  245. return response.CommonPrefixes[i].Prefix < response.CommonPrefixes[j].Prefix
  246. })
  247. response.EncodingType = s3.EncodingTypeUrl
  248. }
  249. return nil
  250. })
  251. return
  252. }
  253. type ListingCursor struct {
  254. maxKeys int
  255. isTruncated bool
  256. prefixEndsOnDelimiter bool
  257. }
  258. // the prefix and marker may be in different directories
  259. // normalizePrefixMarker ensures the prefix and marker both starts from the same directory
  260. func normalizePrefixMarker(prefix, marker string) (alignedDir, alignedPrefix, alignedMarker string) {
  261. // alignedDir should not end with "/"
  262. // alignedDir, alignedPrefix, alignedMarker should only have "/" in middle
  263. if len(marker) == 0 {
  264. prefix = strings.Trim(prefix, "/")
  265. } else {
  266. prefix = strings.TrimLeft(prefix, "/")
  267. }
  268. marker = strings.TrimLeft(marker, "/")
  269. if prefix == "" {
  270. return "", "", marker
  271. }
  272. if marker == "" {
  273. alignedDir, alignedPrefix = toDirAndName(prefix)
  274. return
  275. }
  276. if !strings.HasPrefix(marker, prefix) {
  277. // something wrong
  278. return "", prefix, marker
  279. }
  280. if strings.HasPrefix(marker, prefix+"/") {
  281. alignedDir = prefix
  282. alignedPrefix = ""
  283. alignedMarker = marker[len(alignedDir)+1:]
  284. return
  285. }
  286. alignedDir, alignedPrefix = toDirAndName(prefix)
  287. if alignedDir != "" {
  288. alignedMarker = marker[len(alignedDir)+1:]
  289. } else {
  290. alignedMarker = marker
  291. }
  292. return
  293. }
  294. func toDirAndName(dirAndName string) (dir, name string) {
  295. sepIndex := strings.LastIndex(dirAndName, "/")
  296. if sepIndex >= 0 {
  297. dir, name = dirAndName[0:sepIndex], dirAndName[sepIndex+1:]
  298. } else {
  299. name = dirAndName
  300. }
  301. return
  302. }
  303. func toParentAndDescendants(dirAndName string) (dir, name string) {
  304. sepIndex := strings.Index(dirAndName, "/")
  305. if sepIndex >= 0 {
  306. dir, name = dirAndName[0:sepIndex], dirAndName[sepIndex+1:]
  307. } else {
  308. name = dirAndName
  309. }
  310. return
  311. }
  312. func (s3a *S3ApiServer) doListFilerRecursiveEntries(client filer_pb.SeaweedFilerClient, dir, prefix string, cursor *ListingCursor, marker, delimiter string, inclusiveStartFrom bool, eachEntryFn func(dir string, entry *filer_pb.Entry)) (nextMarker string, err error) {
  313. if prefix == "/" && delimiter == "/" {
  314. return
  315. }
  316. request := &filer_pb.ListEntriesRequest{
  317. Directory: dir,
  318. Prefix: prefix,
  319. Limit: uint32(cursor.maxKeys + 2),
  320. StartFromFileName: marker,
  321. InclusiveStartFrom: inclusiveStartFrom,
  322. Recursive: true,
  323. }
  324. ctx, cancel := context.WithCancel(context.Background())
  325. defer cancel()
  326. stream, listErr := client.ListEntries(ctx, request)
  327. if listErr != nil {
  328. return "", fmt.Errorf("list entires %+v: %v", request, listErr)
  329. }
  330. for {
  331. resp, recvErr := stream.Recv()
  332. if recvErr != nil {
  333. if recvErr == io.EOF {
  334. break
  335. } else {
  336. return "", fmt.Errorf("iterating entires %+v: %v", request, recvErr)
  337. }
  338. }
  339. eachEntryFn(dir, resp.Entry)
  340. }
  341. return
  342. }
  343. func (s3a *S3ApiServer) doListFilerEntries(client filer_pb.SeaweedFilerClient, dir, prefix string, cursor *ListingCursor, marker, delimiter string, inclusiveStartFrom bool, eachEntryFn func(dir string, entry *filer_pb.Entry)) (nextMarker string, err error) {
  344. // invariants
  345. // prefix and marker should be under dir, marker may contain "/"
  346. // maxKeys should be updated for each recursion
  347. // glog.V(4).Infof("doListFilerEntries dir: %s, prefix: %s, marker %s, maxKeys: %d, prefixEndsOnDelimiter: %+v", dir, prefix, marker, cursor.maxKeys, cursor.prefixEndsOnDelimiter)
  348. if prefix == "/" && delimiter == "/" {
  349. return
  350. }
  351. if cursor.maxKeys <= 0 {
  352. return
  353. }
  354. if strings.Contains(marker, "/") {
  355. subDir, subMarker := toParentAndDescendants(marker)
  356. // println("doListFilerEntries dir", dir+"/"+subDir, "subMarker", subMarker)
  357. subNextMarker, subErr := s3a.doListFilerEntries(client, dir+"/"+subDir, "", cursor, subMarker, delimiter, false, eachEntryFn)
  358. if subErr != nil {
  359. err = subErr
  360. return
  361. }
  362. nextMarker = subDir + "/" + subNextMarker
  363. // finished processing this subdirectory
  364. marker = subDir
  365. }
  366. if cursor.isTruncated {
  367. return
  368. }
  369. // now marker is also a direct child of dir
  370. request := &filer_pb.ListEntriesRequest{
  371. Directory: dir,
  372. Prefix: prefix,
  373. Limit: uint32(cursor.maxKeys + 2), // bucket root directory needs to skip additional s3_constants.MultipartUploadsFolder folder
  374. StartFromFileName: marker,
  375. InclusiveStartFrom: inclusiveStartFrom,
  376. }
  377. if cursor.prefixEndsOnDelimiter {
  378. request.Limit = uint32(1)
  379. }
  380. ctx, cancel := context.WithCancel(context.Background())
  381. defer cancel()
  382. stream, listErr := client.ListEntries(ctx, request)
  383. if listErr != nil {
  384. err = fmt.Errorf("list entires %+v: %v", request, listErr)
  385. return
  386. }
  387. for {
  388. resp, recvErr := stream.Recv()
  389. if recvErr != nil {
  390. if recvErr == io.EOF {
  391. break
  392. } else {
  393. err = fmt.Errorf("iterating entires %+v: %v", request, recvErr)
  394. return
  395. }
  396. }
  397. if cursor.maxKeys <= 0 {
  398. cursor.isTruncated = true
  399. continue
  400. }
  401. entry := resp.Entry
  402. nextMarker = entry.Name
  403. if cursor.prefixEndsOnDelimiter {
  404. if entry.Name == prefix && entry.IsDirectory {
  405. if delimiter != "/" {
  406. cursor.prefixEndsOnDelimiter = false
  407. }
  408. } else {
  409. continue
  410. }
  411. }
  412. if entry.IsDirectory {
  413. // glog.V(4).Infof("List Dir Entries %s, file: %s, maxKeys %d", dir, entry.Name, cursor.maxKeys)
  414. if entry.Name == s3_constants.MultipartUploadsFolder { // FIXME no need to apply to all directories. this extra also affects maxKeys
  415. continue
  416. }
  417. if delimiter != "/" || cursor.prefixEndsOnDelimiter {
  418. if cursor.prefixEndsOnDelimiter {
  419. cursor.prefixEndsOnDelimiter = false
  420. if entry.IsDirectoryKeyObject() {
  421. eachEntryFn(dir, entry)
  422. }
  423. } else {
  424. eachEntryFn(dir, entry)
  425. }
  426. subNextMarker, subErr := s3a.doListFilerEntries(client, dir+"/"+entry.Name, "", cursor, "", delimiter, false, eachEntryFn)
  427. if subErr != nil {
  428. err = fmt.Errorf("doListFilerEntries2: %v", subErr)
  429. return
  430. }
  431. // println("doListFilerEntries2 dir", dir+"/"+entry.Name, "subNextMarker", subNextMarker)
  432. nextMarker = entry.Name + "/" + subNextMarker
  433. if cursor.isTruncated {
  434. return
  435. }
  436. // println("doListFilerEntries2 nextMarker", nextMarker)
  437. } else {
  438. var isEmpty bool
  439. if !s3a.option.AllowEmptyFolder && entry.IsOlderDir() {
  440. //if isEmpty, err = s3a.ensureDirectoryAllEmpty(client, dir, entry.Name); err != nil {
  441. // glog.Errorf("check empty folder %s: %v", dir, err)
  442. //}
  443. }
  444. if !isEmpty {
  445. eachEntryFn(dir, entry)
  446. }
  447. }
  448. } else {
  449. eachEntryFn(dir, entry)
  450. // glog.V(4).Infof("List File Entries %s, file: %s, maxKeys %d", dir, entry.Name, cursor.maxKeys)
  451. }
  452. if cursor.prefixEndsOnDelimiter {
  453. cursor.prefixEndsOnDelimiter = false
  454. }
  455. }
  456. return
  457. }
  458. func getListObjectsV2Args(values url.Values) (prefix, startAfter, delimiter string, token OptionalString, encodingTypeUrl bool, fetchOwner bool, maxkeys int) {
  459. prefix = values.Get("prefix")
  460. token = OptionalString{set: values.Has("continuation-token"), string: values.Get("continuation-token")}
  461. startAfter = values.Get("start-after")
  462. delimiter = values.Get("delimiter")
  463. encodingTypeUrl = values.Get("encoding-type") == s3.EncodingTypeUrl
  464. if values.Get("max-keys") != "" {
  465. maxkeys, _ = strconv.Atoi(values.Get("max-keys"))
  466. } else {
  467. maxkeys = maxObjectListSizeLimit
  468. }
  469. fetchOwner = values.Get("fetch-owner") == "true"
  470. return
  471. }
  472. func getListObjectsV1Args(values url.Values) (prefix, marker, delimiter string, encodingTypeUrl bool, maxkeys int) {
  473. prefix = values.Get("prefix")
  474. marker = values.Get("marker")
  475. delimiter = values.Get("delimiter")
  476. encodingTypeUrl = values.Get("encoding-type") == "url"
  477. if values.Get("max-keys") != "" {
  478. maxkeys, _ = strconv.Atoi(values.Get("max-keys"))
  479. } else {
  480. maxkeys = maxObjectListSizeLimit
  481. }
  482. return
  483. }
  484. func (s3a *S3ApiServer) ensureDirectoryAllEmpty(filerClient filer_pb.SeaweedFilerClient, parentDir, name string) (isEmpty bool, err error) {
  485. // println("+ ensureDirectoryAllEmpty", dir, name)
  486. glog.V(4).Infof("+ isEmpty %s/%s", parentDir, name)
  487. defer glog.V(4).Infof("- isEmpty %s/%s %v", parentDir, name, isEmpty)
  488. var fileCounter int
  489. var subDirs []string
  490. currentDir := parentDir + "/" + name
  491. var startFrom string
  492. var isExhausted bool
  493. var foundEntry bool
  494. for fileCounter == 0 && !isExhausted && err == nil {
  495. err = filer_pb.SeaweedList(filerClient, currentDir, "", func(entry *filer_pb.Entry, isLast bool) error {
  496. foundEntry = true
  497. if entry.IsOlderDir() {
  498. subDirs = append(subDirs, entry.Name)
  499. } else {
  500. fileCounter++
  501. }
  502. startFrom = entry.Name
  503. isExhausted = isExhausted || isLast
  504. glog.V(4).Infof(" * %s/%s isLast: %t", currentDir, startFrom, isLast)
  505. return nil
  506. }, startFrom, false, 8)
  507. if !foundEntry {
  508. break
  509. }
  510. }
  511. if err != nil {
  512. return false, err
  513. }
  514. if fileCounter > 0 {
  515. return false, nil
  516. }
  517. for _, subDir := range subDirs {
  518. isSubEmpty, subErr := s3a.ensureDirectoryAllEmpty(filerClient, currentDir, subDir)
  519. if subErr != nil {
  520. return false, subErr
  521. }
  522. if !isSubEmpty {
  523. return false, nil
  524. }
  525. }
  526. glog.V(1).Infof("deleting empty folder %s", currentDir)
  527. if err = doDeleteEntry(filerClient, parentDir, name, true, false); err != nil {
  528. return
  529. }
  530. return true, nil
  531. }