un-index committed on
Commit
45d20de
·
1 Parent(s): 0ddb594
Files changed (1) hide show
  1. app.py +4 -3
app.py CHANGED
@@ -121,6 +121,7 @@ def f(context, temperature, top_p, max_length, model_idx, SPACE_VERIFICATION_KEY
121
  "token_max_length": max_length, # 512,
122
  "temperature": temperature,
123
  "top_p": top_p,
 
124
  }
125
 
126
  response = requests.post(
@@ -143,7 +144,7 @@ def f(context, temperature, top_p, max_length, model_idx, SPACE_VERIFICATION_KEY
143
  # todo fix max_length below, maybe there is a max_new_tokens parameter
144
  # try max_length=len(context)+max_length or =len(context)+max_length or make max_length inf or unspecified
145
  # note: added max_new_tokens parameter to see whether it actually works, if not remove,
146
- # if yes, then make max_length infinite because it seems to be counted as max input length, not output
147
  generated_text = generator(context, max_length=400, max_new_tokens=max_length, top_p=top_p, temperature=temperature, num_return_sequences=1)
148
  except Exception as e:
149
  return "Exception while generating text: " + str(e)
@@ -156,7 +157,7 @@ def f(context, temperature, top_p, max_length, model_idx, SPACE_VERIFICATION_KEY
156
  return generated_text[0][0]['generated_text']
157
  except:
158
  return generated_text # was error due to timeout because of not enabling queue in gradio interface?
159
-
160
  # except:
161
  # generated_text = generator(context, max_length=max_length, top_p=top_p, temperature=temperature, num_return_sequences=1)[0]
162
 
@@ -168,7 +169,7 @@ def f(context, temperature, top_p, max_length, model_idx, SPACE_VERIFICATION_KEY
168
 
169
 
170
  except Exception as e:
171
- return f"error with idx{model_idx} : \n"+str(e)
172
 
173
 
174
  iface = gr.Interface(f, [
 
121
  "token_max_length": max_length, # 512,
122
  "temperature": temperature,
123
  "top_p": top_p,
124
+ "max_time": 120.0
125
  }
126
 
127
  response = requests.post(
 
144
  # todo fix max_length below, maybe there is a max_new_tokens parameter
145
  # try max_length=len(context)+max_length or =len(context)+max_length or make max_length inf or unspecified
146
  # note: added max_new_tokens parameter to see whether it actually works, if not remove,
147
+ # TODO if yes, then make max_length infinite because it seems to be counted as max input length, not output
148
  generated_text = generator(context, max_length=400, max_new_tokens=max_length, top_p=top_p, temperature=temperature, num_return_sequences=1)
149
  except Exception as e:
150
  return "Exception while generating text: " + str(e)
 
157
  return generated_text[0][0]['generated_text']
158
  except:
159
  return generated_text # was error due to timeout because of not enabling queue in gradio interface?
160
+ # if it works right now, then that was the reason for the JSON parsing error
161
  # except:
162
  # generated_text = generator(context, max_length=max_length, top_p=top_p, temperature=temperature, num_return_sequences=1)[0]
163
 
 
169
 
170
 
171
  except Exception as e:
172
+ return f"error with idx{model_idx}: "+str(e)
173
 
174
 
175
  iface = gr.Interface(f, [