s3api_object_handlers.go 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565
  1. package s3api
  2. import (
  3. "bytes"
  4. "crypto/md5"
  5. "encoding/json"
  6. "encoding/xml"
  7. "fmt"
  8. "io"
  9. "net/http"
  10. "net/url"
  11. "strings"
  12. "time"
  13. "github.com/seaweedfs/seaweedfs/weed/s3api/s3_constants"
  14. "github.com/seaweedfs/seaweedfs/weed/security"
  15. "github.com/seaweedfs/seaweedfs/weed/util/mem"
  16. "golang.org/x/exp/slices"
  17. "github.com/pquerna/cachecontrol/cacheobject"
  18. "github.com/seaweedfs/seaweedfs/weed/filer"
  19. "github.com/seaweedfs/seaweedfs/weed/s3api/s3err"
  20. "github.com/seaweedfs/seaweedfs/weed/glog"
  21. "github.com/seaweedfs/seaweedfs/weed/pb/filer_pb"
  22. weed_server "github.com/seaweedfs/seaweedfs/weed/server"
  23. "github.com/seaweedfs/seaweedfs/weed/util"
  24. )
  // deleteMultipleObjectsLimit is the largest number of keys accepted in one
  // multi-object delete request; DeleteMultipleObjectsHandler rejects longer
  // lists.
  const deleteMultipleObjectsLimit = 1000
  // mimeDetect sniffs the content type of an upload that did not declare one.
  //
  // It reads up to the first 512 bytes of dataReader, stores the type reported
  // by http.DetectContentType in r's "Content-Type" header, and returns a
  // reader that replays the sniffed bytes followed by the rest of dataReader,
  // so no payload data is lost. When nothing can be read the header is left
  // untouched and dataReader is returned as is. Close on the returned value is
  // a no-op; the caller stays responsible for closing the underlying stream.
  func mimeDetect(r *http.Request, dataReader io.Reader) io.ReadCloser {
  	// http.DetectContentType considers at most the first 512 bytes.
  	mimeBuffer := make([]byte, 512)

  	// A single Read may return far fewer bytes than requested (for example
  	// one network segment), which would make detection depend on how the
  	// data happened to arrive. io.ReadFull keeps reading until the sniffing
  	// window is full or the stream ends.
  	//
  	// The error is intentionally ignored: io.EOF / io.ErrUnexpectedEOF only
  	// mean the payload is shorter than the window, and any other failure is
  	// expected to surface again when the consumer reads the remainder.
  	size, _ := io.ReadFull(dataReader, mimeBuffer)
  	if size == 0 {
  		return io.NopCloser(dataReader)
  	}

  	head := mimeBuffer[:size]
  	r.Header.Set("Content-Type", http.DetectContentType(head))
  	return io.NopCloser(io.MultiReader(bytes.NewReader(head), dataReader))
  }
  37. func (s3a *S3ApiServer) PutObjectHandler(w http.ResponseWriter, r *http.Request) {
  38. // http://docs.aws.amazon.com/AmazonS3/latest/dev/UploadingObjects.html
  39. bucket, object := s3_constants.GetBucketAndObject(r)
  40. glog.V(3).Infof("PutObjectHandler %s %s", bucket, object)
  41. _, err := validateContentMd5(r.Header)
  42. if err != nil {
  43. s3err.WriteErrorResponse(w, r, s3err.ErrInvalidDigest)
  44. return
  45. }
  46. if r.Header.Get("Cache-Control") != "" {
  47. if _, err = cacheobject.ParseRequestCacheControl(r.Header.Get("Cache-Control")); err != nil {
  48. s3err.WriteErrorResponse(w, r, s3err.ErrInvalidDigest)
  49. return
  50. }
  51. }
  52. if r.Header.Get("Expires") != "" {
  53. if _, err = time.Parse(http.TimeFormat, r.Header.Get("Expires")); err != nil {
  54. s3err.WriteErrorResponse(w, r, s3err.ErrMalformedDate)
  55. return
  56. }
  57. }
  58. dataReader := r.Body
  59. rAuthType := getRequestAuthType(r)
  60. if s3a.iam.isEnabled() {
  61. var s3ErrCode s3err.ErrorCode
  62. switch rAuthType {
  63. case authTypeStreamingSigned:
  64. dataReader, s3ErrCode = s3a.iam.newSignV4ChunkedReader(r)
  65. case authTypeSignedV2, authTypePresignedV2:
  66. _, s3ErrCode = s3a.iam.isReqAuthenticatedV2(r)
  67. case authTypePresigned, authTypeSigned:
  68. _, s3ErrCode = s3a.iam.reqSignatureV4Verify(r)
  69. }
  70. if s3ErrCode != s3err.ErrNone {
  71. s3err.WriteErrorResponse(w, r, s3ErrCode)
  72. return
  73. }
  74. } else {
  75. if authTypeStreamingSigned == rAuthType {
  76. s3err.WriteErrorResponse(w, r, s3err.ErrAuthNotSetup)
  77. return
  78. }
  79. }
  80. defer dataReader.Close()
  81. objectContentType := r.Header.Get("Content-Type")
  82. if strings.HasSuffix(object, "/") && r.ContentLength <= 1024 {
  83. if err := s3a.mkdir(
  84. s3a.option.BucketsPath, bucket+strings.TrimSuffix(object, "/"),
  85. func(entry *filer_pb.Entry) {
  86. if objectContentType == "" {
  87. objectContentType = s3_constants.FolderMimeType
  88. }
  89. if r.ContentLength > 0 {
  90. entry.Content, _ = io.ReadAll(r.Body)
  91. }
  92. entry.Attributes.Mime = objectContentType
  93. }); err != nil {
  94. s3err.WriteErrorResponse(w, r, s3err.ErrInternalError)
  95. return
  96. }
  97. } else {
  98. uploadUrl := s3a.toFilerUrl(bucket, object)
  99. if objectContentType == "" {
  100. dataReader = mimeDetect(r, dataReader)
  101. }
  102. etag, errCode := s3a.putToFiler(r, uploadUrl, dataReader, "", bucket)
  103. if errCode != s3err.ErrNone {
  104. s3err.WriteErrorResponse(w, r, errCode)
  105. return
  106. }
  107. setEtag(w, etag)
  108. }
  109. writeSuccessResponseEmpty(w, r)
  110. }
  111. func urlEscapeObject(object string) string {
  112. t := urlPathEscape(removeDuplicateSlashes(object))
  113. if strings.HasPrefix(t, "/") {
  114. return t
  115. }
  116. return "/" + t
  117. }
  // urlPathEscape applies url.PathEscape to every "/"-separated segment of
  // object and joins the segments back together, so the slashes themselves are
  // kept as path separators.
  func urlPathEscape(object string) string {
  	segments := strings.Split(object, "/")
  	for i, segment := range segments {
  		segments[i] = url.PathEscape(segment)
  	}
  	return strings.Join(segments, "/")
  }
  // removeDuplicateSlashes returns object with every run of consecutive '/'
  // characters reduced to a single '/'. All other runes are copied unchanged.
  func removeDuplicateSlashes(object string) string {
  	var out strings.Builder
  	out.Grow(len(object))

  	prevWasSlash := false
  	for _, c := range object {
  		curIsSlash := c == '/'
  		// Only a slash that directly follows another slash is dropped.
  		if !(curIsSlash && prevWasSlash) {
  			out.WriteRune(c)
  		}
  		prevWasSlash = curIsSlash
  	}
  	return out.String()
  }
  143. func (s3a *S3ApiServer) toFilerUrl(bucket, object string) string {
  144. object = urlPathEscape(removeDuplicateSlashes(object))
  145. destUrl := fmt.Sprintf("http://%s%s/%s%s",
  146. s3a.option.Filer.ToHttpAddress(), s3a.option.BucketsPath, bucket, object)
  147. return destUrl
  148. }
  149. func (s3a *S3ApiServer) GetObjectHandler(w http.ResponseWriter, r *http.Request) {
  150. bucket, object := s3_constants.GetBucketAndObject(r)
  151. glog.V(3).Infof("GetObjectHandler %s %s", bucket, object)
  152. if strings.HasSuffix(r.URL.Path, "/") {
  153. s3err.WriteErrorResponse(w, r, s3err.ErrNotImplemented)
  154. return
  155. }
  156. destUrl := s3a.toFilerUrl(bucket, object)
  157. s3a.proxyToFiler(w, r, destUrl, false, passThroughResponse)
  158. }
  159. func (s3a *S3ApiServer) HeadObjectHandler(w http.ResponseWriter, r *http.Request) {
  160. bucket, object := s3_constants.GetBucketAndObject(r)
  161. glog.V(3).Infof("HeadObjectHandler %s %s", bucket, object)
  162. destUrl := s3a.toFilerUrl(bucket, object)
  163. s3a.proxyToFiler(w, r, destUrl, false, passThroughResponse)
  164. }
  165. func (s3a *S3ApiServer) DeleteObjectHandler(w http.ResponseWriter, r *http.Request) {
  166. bucket, object := s3_constants.GetBucketAndObject(r)
  167. glog.V(3).Infof("DeleteObjectHandler %s %s", bucket, object)
  168. destUrl := s3a.toFilerUrl(bucket, object)
  169. s3a.proxyToFiler(w, r, destUrl, true, func(proxyResponse *http.Response, w http.ResponseWriter) (statusCode int) {
  170. statusCode = http.StatusNoContent
  171. for k, v := range proxyResponse.Header {
  172. w.Header()[k] = v
  173. }
  174. w.WriteHeader(statusCode)
  175. return statusCode
  176. })
  177. }
  // ObjectIdentifier names one object of a multi-object delete by its key.
  type ObjectIdentifier struct {
  	// ObjectName is the object key; it maps to the <Key> XML element.
  	ObjectName string `xml:"Key"`
  }
  182. // DeleteObjectsRequest - xml carrying the object key names which needs to be deleted.
  183. type DeleteObjectsRequest struct {
  184. // Element to enable quiet mode for the request
  185. Quiet bool
  186. // List of objects to be deleted
  187. Objects []ObjectIdentifier `xml:"Object"`
  188. }
  // DeleteError describes one object that could not be deleted: an error Code,
  // a human-readable Message, and the Key of the object concerned.
  type DeleteError struct {
  	Code, Message, Key string
  }
  195. // DeleteObjectsResponse container for multiple object deletes.
  196. type DeleteObjectsResponse struct {
  197. XMLName xml.Name `xml:"http://s3.amazonaws.com/doc/2006-03-01/ DeleteResult" json:"-"`
  198. // Collection of all deleted objects
  199. DeletedObjects []ObjectIdentifier `xml:"Deleted,omitempty"`
  200. // Collection of errors deleting certain objects.
  201. Errors []DeleteError `xml:"Error,omitempty"`
  202. }
  203. // DeleteMultipleObjectsHandler - Delete multiple objects
  204. func (s3a *S3ApiServer) DeleteMultipleObjectsHandler(w http.ResponseWriter, r *http.Request) {
  205. bucket, _ := s3_constants.GetBucketAndObject(r)
  206. glog.V(3).Infof("DeleteMultipleObjectsHandler %s", bucket)
  207. deleteXMLBytes, err := io.ReadAll(r.Body)
  208. if err != nil {
  209. s3err.WriteErrorResponse(w, r, s3err.ErrInternalError)
  210. return
  211. }
  212. deleteObjects := &DeleteObjectsRequest{}
  213. if err := xml.Unmarshal(deleteXMLBytes, deleteObjects); err != nil {
  214. s3err.WriteErrorResponse(w, r, s3err.ErrMalformedXML)
  215. return
  216. }
  217. if len(deleteObjects.Objects) > deleteMultipleObjectsLimit {
  218. s3err.WriteErrorResponse(w, r, s3err.ErrInvalidMaxDeleteObjects)
  219. return
  220. }
  221. var deletedObjects []ObjectIdentifier
  222. var deleteErrors []DeleteError
  223. var auditLog *s3err.AccessLog
  224. directoriesWithDeletion := make(map[string]int)
  225. if s3err.Logger != nil {
  226. auditLog = s3err.GetAccessLog(r, http.StatusNoContent, s3err.ErrNone)
  227. }
  228. s3a.WithFilerClient(false, func(client filer_pb.SeaweedFilerClient) error {
  229. // delete file entries
  230. for _, object := range deleteObjects.Objects {
  231. if object.ObjectName == "" {
  232. continue
  233. }
  234. lastSeparator := strings.LastIndex(object.ObjectName, "/")
  235. parentDirectoryPath, entryName, isDeleteData, isRecursive := "", object.ObjectName, true, false
  236. if lastSeparator > 0 && lastSeparator+1 < len(object.ObjectName) {
  237. entryName = object.ObjectName[lastSeparator+1:]
  238. parentDirectoryPath = "/" + object.ObjectName[:lastSeparator]
  239. }
  240. parentDirectoryPath = fmt.Sprintf("%s/%s%s", s3a.option.BucketsPath, bucket, parentDirectoryPath)
  241. err := doDeleteEntry(client, parentDirectoryPath, entryName, isDeleteData, isRecursive)
  242. if err == nil {
  243. directoriesWithDeletion[parentDirectoryPath]++
  244. deletedObjects = append(deletedObjects, object)
  245. } else if strings.Contains(err.Error(), filer.MsgFailDelNonEmptyFolder) {
  246. deletedObjects = append(deletedObjects, object)
  247. } else {
  248. delete(directoriesWithDeletion, parentDirectoryPath)
  249. deleteErrors = append(deleteErrors, DeleteError{
  250. Code: "",
  251. Message: err.Error(),
  252. Key: object.ObjectName,
  253. })
  254. }
  255. if auditLog != nil {
  256. auditLog.Key = entryName
  257. s3err.PostAccessLog(*auditLog)
  258. }
  259. }
  260. // purge empty folders, only checking folders with deletions
  261. for len(directoriesWithDeletion) > 0 {
  262. directoriesWithDeletion = s3a.doDeleteEmptyDirectories(client, directoriesWithDeletion)
  263. }
  264. return nil
  265. })
  266. deleteResp := DeleteObjectsResponse{}
  267. if !deleteObjects.Quiet {
  268. deleteResp.DeletedObjects = deletedObjects
  269. }
  270. deleteResp.Errors = deleteErrors
  271. writeSuccessResponseXML(w, r, deleteResp)
  272. }
  273. func (s3a *S3ApiServer) doDeleteEmptyDirectories(client filer_pb.SeaweedFilerClient, directoriesWithDeletion map[string]int) (newDirectoriesWithDeletion map[string]int) {
  274. var allDirs []string
  275. for dir := range directoriesWithDeletion {
  276. allDirs = append(allDirs, dir)
  277. }
  278. slices.SortFunc(allDirs, func(a, b string) int {
  279. return len(b) - len(a)
  280. })
  281. newDirectoriesWithDeletion = make(map[string]int)
  282. for _, dir := range allDirs {
  283. parentDir, dirName := util.FullPath(dir).DirAndName()
  284. if parentDir == s3a.option.BucketsPath {
  285. continue
  286. }
  287. if err := doDeleteEntry(client, parentDir, dirName, false, false); err != nil {
  288. glog.V(4).Infof("directory %s has %d deletion but still not empty: %v", dir, directoriesWithDeletion[dir], err)
  289. } else {
  290. newDirectoriesWithDeletion[parentDir]++
  291. }
  292. }
  293. return
  294. }
  295. func (s3a *S3ApiServer) proxyToFiler(w http.ResponseWriter, r *http.Request, destUrl string, isWrite bool, responseFn func(proxyResponse *http.Response, w http.ResponseWriter) (statusCode int)) {
  296. glog.V(3).Infof("s3 proxying %s to %s", r.Method, destUrl)
  297. start := time.Now()
  298. proxyReq, err := http.NewRequest(r.Method, destUrl, r.Body)
  299. if err != nil {
  300. glog.Errorf("NewRequest %s: %v", destUrl, err)
  301. s3err.WriteErrorResponse(w, r, s3err.ErrInternalError)
  302. return
  303. }
  304. proxyReq.Header.Set("X-Forwarded-For", r.RemoteAddr)
  305. for k, v := range r.URL.Query() {
  306. if _, ok := s3_constants.PassThroughHeaders[strings.ToLower(k)]; ok {
  307. proxyReq.Header[k] = v
  308. }
  309. }
  310. for header, values := range r.Header {
  311. proxyReq.Header[header] = values
  312. }
  313. // ensure that the Authorization header is overriding any previous
  314. // Authorization header which might be already present in proxyReq
  315. s3a.maybeAddFilerJwtAuthorization(proxyReq, isWrite)
  316. resp, postErr := s3a.client.Do(proxyReq)
  317. if postErr != nil {
  318. glog.Errorf("post to filer: %v", postErr)
  319. s3err.WriteErrorResponse(w, r, s3err.ErrInternalError)
  320. return
  321. }
  322. defer util.CloseResponse(resp)
  323. if resp.StatusCode == http.StatusPreconditionFailed {
  324. s3err.WriteErrorResponse(w, r, s3err.ErrPreconditionFailed)
  325. return
  326. }
  327. if resp.StatusCode == http.StatusRequestedRangeNotSatisfiable {
  328. s3err.WriteErrorResponse(w, r, s3err.ErrInvalidRange)
  329. return
  330. }
  331. if r.Method == "DELETE" {
  332. if resp.StatusCode == http.StatusNotFound {
  333. // this is normal
  334. responseStatusCode := responseFn(resp, w)
  335. s3err.PostLog(r, responseStatusCode, s3err.ErrNone)
  336. return
  337. }
  338. }
  339. if resp.StatusCode == http.StatusNotFound {
  340. s3err.WriteErrorResponse(w, r, s3err.ErrNoSuchKey)
  341. return
  342. }
  343. TimeToFirstByte(r.Method, start, r)
  344. if resp.Header.Get(s3_constants.X_SeaweedFS_Header_Directory_Key) == "true" {
  345. responseStatusCode := responseFn(resp, w)
  346. s3err.PostLog(r, responseStatusCode, s3err.ErrNone)
  347. return
  348. }
  349. if resp.StatusCode == http.StatusInternalServerError {
  350. s3err.WriteErrorResponse(w, r, s3err.ErrInternalError)
  351. return
  352. }
  353. // when HEAD a directory, it should be reported as no such key
  354. // https://github.com/seaweedfs/seaweedfs/issues/3457
  355. if resp.ContentLength == -1 && resp.StatusCode != http.StatusNotModified {
  356. s3err.WriteErrorResponse(w, r, s3err.ErrNoSuchKey)
  357. return
  358. }
  359. setUserMetadataKeyToLowercase(resp)
  360. responseStatusCode := responseFn(resp, w)
  361. s3err.PostLog(r, responseStatusCode, s3err.ErrNone)
  362. }
  363. func setUserMetadataKeyToLowercase(resp *http.Response) {
  364. for key, value := range resp.Header {
  365. if strings.HasPrefix(key, s3_constants.AmzUserMetaPrefix) {
  366. resp.Header[strings.ToLower(key)] = value
  367. delete(resp.Header, key)
  368. }
  369. }
  370. }
  371. func passThroughResponse(proxyResponse *http.Response, w http.ResponseWriter) (statusCode int) {
  372. for k, v := range proxyResponse.Header {
  373. w.Header()[k] = v
  374. }
  375. if proxyResponse.Header.Get("Content-Range") != "" && proxyResponse.StatusCode == 200 {
  376. w.WriteHeader(http.StatusPartialContent)
  377. statusCode = http.StatusPartialContent
  378. } else {
  379. statusCode = proxyResponse.StatusCode
  380. }
  381. w.WriteHeader(statusCode)
  382. buf := mem.Allocate(128 * 1024)
  383. defer mem.Free(buf)
  384. if n, err := io.CopyBuffer(w, proxyResponse.Body, buf); err != nil {
  385. glog.V(1).Infof("passthrough response read %d bytes: %v", n, err)
  386. }
  387. return statusCode
  388. }
  389. func (s3a *S3ApiServer) putToFiler(r *http.Request, uploadUrl string, dataReader io.Reader, destination string, bucket string) (etag string, code s3err.ErrorCode) {
  390. hash := md5.New()
  391. var body = io.TeeReader(dataReader, hash)
  392. proxyReq, err := http.NewRequest("PUT", uploadUrl, body)
  393. if err != nil {
  394. glog.Errorf("NewRequest %s: %v", uploadUrl, err)
  395. return "", s3err.ErrInternalError
  396. }
  397. proxyReq.Header.Set("X-Forwarded-For", r.RemoteAddr)
  398. if destination != "" {
  399. proxyReq.Header.Set(s3_constants.SeaweedStorageDestinationHeader, destination)
  400. }
  401. if s3a.option.FilerGroup != "" {
  402. query := proxyReq.URL.Query()
  403. query.Add("collection", s3a.getCollectionName(bucket))
  404. proxyReq.URL.RawQuery = query.Encode()
  405. }
  406. for header, values := range r.Header {
  407. for _, value := range values {
  408. proxyReq.Header.Add(header, value)
  409. }
  410. }
  411. // ensure that the Authorization header is overriding any previous
  412. // Authorization header which might be already present in proxyReq
  413. s3a.maybeAddFilerJwtAuthorization(proxyReq, true)
  414. resp, postErr := s3a.client.Do(proxyReq)
  415. if postErr != nil {
  416. glog.Errorf("post to filer: %v", postErr)
  417. return "", s3err.ErrInternalError
  418. }
  419. defer resp.Body.Close()
  420. etag = fmt.Sprintf("%x", hash.Sum(nil))
  421. resp_body, ra_err := io.ReadAll(resp.Body)
  422. if ra_err != nil {
  423. glog.Errorf("upload to filer response read %d: %v", resp.StatusCode, ra_err)
  424. return etag, s3err.ErrInternalError
  425. }
  426. var ret weed_server.FilerPostResult
  427. unmarshal_err := json.Unmarshal(resp_body, &ret)
  428. if unmarshal_err != nil {
  429. glog.Errorf("failing to read upload to %s : %v", uploadUrl, string(resp_body))
  430. return "", s3err.ErrInternalError
  431. }
  432. if ret.Error != "" {
  433. glog.Errorf("upload to filer error: %v", ret.Error)
  434. return "", filerErrorToS3Error(ret.Error)
  435. }
  436. return etag, s3err.ErrNone
  437. }
  // setEtag stores etag in the response's "ETag" header, wrapping it in double
  // quotes unless it already begins with one. An empty etag leaves the
  // headers unchanged. The header map is written directly so the key keeps
  // its exact "ETag" spelling.
  func setEtag(w http.ResponseWriter, etag string) {
  	if etag == "" {
  		return
  	}
  	if !strings.HasPrefix(etag, "\"") {
  		etag = "\"" + etag + "\""
  	}
  	w.Header()["ETag"] = []string{etag}
  }
  447. func filerErrorToS3Error(errString string) s3err.ErrorCode {
  448. switch {
  449. case strings.HasPrefix(errString, "existing ") && strings.HasSuffix(errString, "is a directory"):
  450. return s3err.ErrExistingObjectIsDirectory
  451. case strings.HasSuffix(errString, "is a file"):
  452. return s3err.ErrExistingObjectIsFile
  453. default:
  454. return s3err.ErrInternalError
  455. }
  456. }
  457. func (s3a *S3ApiServer) maybeAddFilerJwtAuthorization(r *http.Request, isWrite bool) {
  458. encodedJwt := s3a.maybeGetFilerJwtAuthorizationToken(isWrite)
  459. if encodedJwt == "" {
  460. return
  461. }
  462. r.Header.Set("Authorization", "BEARER "+string(encodedJwt))
  463. }
  464. func (s3a *S3ApiServer) maybeGetFilerJwtAuthorizationToken(isWrite bool) string {
  465. var encodedJwt security.EncodedJwt
  466. if isWrite {
  467. encodedJwt = security.GenJwtForFilerServer(s3a.filerGuard.SigningKey, s3a.filerGuard.ExpiresAfterSec)
  468. } else {
  469. encodedJwt = security.GenJwtForFilerServer(s3a.filerGuard.ReadSigningKey, s3a.filerGuard.ReadExpiresAfterSec)
  470. }
  471. return string(encodedJwt)
  472. }